<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
<html xmlns="http://www.w3.org/1999/xhtml">
<head>
<meta http-equiv="Content-Type" content="text/xhtml;charset=UTF-8"/>
<meta http-equiv="X-UA-Compatible" content="IE=9"/>
<meta name="generator" content="Doxygen 1.8.11"/>
<title>CUTLASS: default_mma_core_simt.h Source File</title>
<!-- Stylesheets and scripts shipped with the generated documentation: tabs, jQuery, dynamic sections and search. -->
<link href="tabs.css" rel="stylesheet" type="text/css"/>
<script type="text/javascript" src="jquery.js"></script>
<script type="text/javascript" src="dynsections.js"></script>
<link href="search/search.css" rel="stylesheet" type="text/css"/>
<script type="text/javascript" src="search/searchdata.js"></script>
<script type="text/javascript" src="search/search.js"></script>
<!-- Run init_search() once the document is ready. -->
<script type="text/javascript">
  $(document).ready(function() { init_search(); });
</script>
<!-- MathJax configuration block; it must appear before the MathJax.js script element below. -->
<script type="text/x-mathjax-config">
  MathJax.Hub.Config({
    extensions: ["tex2jax.js"],
    jax: ["input/TeX","output/HTML-CSS"],
});
</script>
<!-- MathJax is fetched over HTTPS from cdnjs: the former http://cdn.mathjax.org host has been retired,
     and a plain-HTTP script is blocked as mixed content when this page is served over HTTPS. -->
<script type="text/javascript" src="https://cdnjs.cloudflare.com/ajax/libs/mathjax/2.7.7/MathJax.js"></script>
<link href="doxygen.css" rel="stylesheet" type="text/css" />
</head>
<body>
<div id="top"><!-- do not remove this div, it is closed by doxygen! -->
<div id="titlearea">
<!-- Page banner: a single-row table whose first cell holds the project logo and whose second cell holds the project name and brief description. -->
<table cellspacing="0" cellpadding="0">
 <tbody>
 <tr style="height: 56px;">
  <td id="projectlogo"><img alt="Logo" src="cutlass-logo-small.png"/></td>
  <td id="projectalign" style="padding-left: 0.5em;">
   <div id="projectname">CUTLASS
   </div>
   <div id="projectbrief">CUDA Templates for Linear Algebra Subroutines and Solvers</div>
  </td>
 </tr>
 </tbody>
</table>
</div>
<!-- end header part -->
<!-- Generated by Doxygen 1.8.11 -->
<script type="text/javascript">
  // Global search controller; the inline event handlers in the search markup call its methods.
  var searchBox = new SearchBox('searchBox', 'search', false, 'Search');
</script>
  <div id="navrow1" class="tabs">
    <!-- Top-level navigation tabs; the last list item hosts the search box. -->
    <ul class="tablist">
      <li><a href="index.html"><span>Main&#160;Page</span></a></li>
      <li><a href="modules.html"><span>Modules</span></a></li>
      <li><a href="namespaces.html"><span>Namespaces</span></a></li>
      <li><a href="annotated.html"><span>Classes</span></a></li>
      <li class="current"><a href="files.html"><span>Files</span></a></li>
      <li>
        <div id="MSearchBox" class="MSearchBoxInactive">
        <span class="left">
          <img id="MSearchSelect" src="search/mag_sel.png"
               onmouseover="return searchBox.OnSearchSelectShow()"
               onmouseout="return searchBox.OnSearchSelectHide()"
               alt=""/>
          <!-- aria-label gives the field an accessible name; the "Search" value is only prompt text inside the field. -->
          <input type="text" id="MSearchField" value="Search" accesskey="S"
               aria-label="Search"
               onfocus="searchBox.OnSearchFieldFocus(true)"
               onblur="searchBox.OnSearchFieldFocus(false)"
               onkeyup="searchBox.OnSearchFieldChange(event)"/>
          </span><span class="right">
            <!-- The image is the only content of this link, so its alt text is what names the link. -->
            <a id="MSearchClose" href="javascript:searchBox.CloseResultsWindow()"><img id="MSearchCloseImg" border="0" src="search/close.png" alt="Close search results"/></a>
          </span>
        </div>
      </li>
    </ul>
  </div>
  <div id="navrow2" class="tabs2">
    <!-- Second-level tabs linking to the file list and file members pages. -->
    <ul class="tablist">
      <li><a href="files.html"><span>File&#160;List</span></a></li>
      <li><a href="globals.html"><span>File&#160;Members</span></a></li>
    </ul>
  </div>
<!-- Window showing the search filter options. It is empty in this markup; its mouse and key events are passed to the global searchBox object. -->
<div id="MSearchSelectWindow"
     onmouseover="return searchBox.OnSearchSelectShow()"
     onmouseout="return searchBox.OnSearchSelectHide()"
     onkeydown="return searchBox.OnSearchSelectKey(event)">
</div>

<!-- iframe showing the search results (closed by default); the title attribute gives the frame an accessible name -->
<div id="MSearchResultsWindow">
<iframe src="javascript:void(0)" frameborder="0" title="Search results"
        name="MSearchResults" id="MSearchResults">
</iframe>
</div>

<div id="nav-path" class="navpath">
  <!-- Breadcrumb trail: one link per directory level, from include down to threadblock. -->
  <ul>
<li class="navelem"><a class="el" href="dir_d44c64559bbebec7f509842c48db8b23.html">include</a></li><li class="navelem"><a class="el" href="dir_6baf2bb612a2f0daa69af3101ede80a1.html">cutlass</a></li><li class="navelem"><a class="el" href="dir_9aa36bd9cfad59a1f88859a38871c977.html">gemm</a></li><li class="navelem"><a class="el" href="dir_ffb18c781d484e5d1c680f712f01a439.html">threadblock</a></li>  </ul>
</div>
</div><!-- top -->
<div class="header">
  <!-- Page heading: the name of the file whose source listing follows. -->
  <div class="headertitle">
<div class="title">default_mma_core_simt.h</div>  </div>
</div><!--header-->
<div class="contents">
<a href="default__mma__core__simt_8h.html">Go to the documentation of this file.</a><div class="fragment"><div class="line"><a name="l00001"></a><span class="lineno">    1</span>&#160;<span class="comment">/***************************************************************************************************</span></div><div class="line"><a name="l00002"></a><span class="lineno">    2</span>&#160;<span class="comment"> * Copyright (c) 2017-2019, NVIDIA CORPORATION.  All rights reserved.</span></div><div class="line"><a name="l00003"></a><span class="lineno">    3</span>&#160;<span class="comment"> *</span></div><div class="line"><a name="l00004"></a><span class="lineno">    4</span>&#160;<span class="comment"> * Redistribution and use in source and binary forms, with or without modification, are permitted</span></div><div class="line"><a name="l00005"></a><span class="lineno">    5</span>&#160;<span class="comment"> * provided that the following conditions are met:</span></div><div class="line"><a name="l00006"></a><span class="lineno">    6</span>&#160;<span class="comment"> *     * Redistributions of source code must retain the above copyright notice, this list of</span></div><div class="line"><a name="l00007"></a><span class="lineno">    7</span>&#160;<span class="comment"> *       conditions and the following disclaimer.</span></div><div class="line"><a name="l00008"></a><span class="lineno">    8</span>&#160;<span class="comment"> *     * Redistributions in binary form must reproduce the above copyright notice, this list of</span></div><div class="line"><a name="l00009"></a><span class="lineno">    9</span>&#160;<span class="comment"> *       conditions and the following disclaimer in the documentation and/or other materials</span></div><div class="line"><a name="l00010"></a><span class="lineno">   10</span>&#160;<span class="comment"> *       provided with the distribution.</span></div><div class="line"><a name="l00011"></a><span class="lineno">   
11</span>&#160;<span class="comment"> *     * Neither the name of the NVIDIA CORPORATION nor the names of its contributors may be used</span></div><div class="line"><a name="l00012"></a><span class="lineno">   12</span>&#160;<span class="comment"> *       to endorse or promote products derived from this software without specific prior written</span></div><div class="line"><a name="l00013"></a><span class="lineno">   13</span>&#160;<span class="comment"> *       permission.</span></div><div class="line"><a name="l00014"></a><span class="lineno">   14</span>&#160;<span class="comment"> *</span></div><div class="line"><a name="l00015"></a><span class="lineno">   15</span>&#160;<span class="comment"> * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS &quot;AS IS&quot; AND ANY EXPRESS OR</span></div><div class="line"><a name="l00016"></a><span class="lineno">   16</span>&#160;<span class="comment"> * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND</span></div><div class="line"><a name="l00017"></a><span class="lineno">   17</span>&#160;<span class="comment"> * FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. 
IN NO EVENT SHALL NVIDIA CORPORATION BE LIABLE</span></div><div class="line"><a name="l00018"></a><span class="lineno">   18</span>&#160;<span class="comment"> * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,</span></div><div class="line"><a name="l00019"></a><span class="lineno">   19</span>&#160;<span class="comment"> * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;</span></div><div class="line"><a name="l00020"></a><span class="lineno">   20</span>&#160;<span class="comment"> * OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,</span></div><div class="line"><a name="l00021"></a><span class="lineno">   21</span>&#160;<span class="comment"> * STRICT LIABILITY, OR TOR (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE</span></div><div class="line"><a name="l00022"></a><span class="lineno">   22</span>&#160;<span class="comment"> * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.</span></div><div class="line"><a name="l00023"></a><span class="lineno">   23</span>&#160;<span class="comment"> *</span></div><div class="line"><a name="l00024"></a><span class="lineno">   24</span>&#160;<span class="comment"> **************************************************************************************************/</span></div><div class="line"><a name="l00032"></a><span class="lineno">   32</span>&#160;<span class="preprocessor">#pragma once</span></div><div class="line"><a name="l00033"></a><span class="lineno">   33</span>&#160;</div><div class="line"><a name="l00034"></a><span class="lineno">   34</span>&#160;<span class="preprocessor">#include &quot;<a class="code" href="cutlass_8h.html">cutlass/cutlass.h</a>&quot;</span></div><div class="line"><a name="l00035"></a><span class="lineno">   35</span>&#160;<span class="preprocessor">#include &quot;<a class="code" 
href="array_8h.html">cutlass/array.h</a>&quot;</span></div><div class="line"><a name="l00036"></a><span class="lineno">   36</span>&#160;<span class="preprocessor">#include &quot;<a class="code" href="fast__math_8h.html">cutlass/fast_math.h</a>&quot;</span></div><div class="line"><a name="l00037"></a><span class="lineno">   37</span>&#160;</div><div class="line"><a name="l00038"></a><span class="lineno">   38</span>&#160;<span class="preprocessor">#include &quot;<a class="code" href="numeric__types_8h.html">cutlass/numeric_types.h</a>&quot;</span></div><div class="line"><a name="l00039"></a><span class="lineno">   39</span>&#160;<span class="preprocessor">#include &quot;<a class="code" href="matrix__shape_8h.html">cutlass/matrix_shape.h</a>&quot;</span></div><div class="line"><a name="l00040"></a><span class="lineno">   40</span>&#160;</div><div class="line"><a name="l00041"></a><span class="lineno">   41</span>&#160;</div><div class="line"><a name="l00042"></a><span class="lineno">   42</span>&#160;<span class="preprocessor">#include &quot;<a class="code" href="pitch__linear__thread__map_8h.html">cutlass/transform/pitch_linear_thread_map.h</a>&quot;</span></div><div class="line"><a name="l00043"></a><span class="lineno">   43</span>&#160;<span class="preprocessor">#include &quot;<a class="code" href="regular__tile__iterator__pitch__linear_8h.html">cutlass/transform/threadblock/regular_tile_iterator_pitch_linear.h</a>&quot;</span></div><div class="line"><a name="l00044"></a><span class="lineno">   44</span>&#160;<span class="preprocessor">#include &quot;<a class="code" href="regular__tile__iterator__pitch__linear__2dthreadtile_8h.html">cutlass/transform/threadblock/regular_tile_iterator_pitch_linear_2dthreadtile.h</a>&quot;</span></div><div class="line"><a name="l00045"></a><span class="lineno">   45</span>&#160;</div><div class="line"><a name="l00046"></a><span class="lineno">   46</span>&#160;<span class="preprocessor">#include &quot;<a class="code" 
href="mma__simt__policy_8h.html">cutlass/gemm/warp/mma_simt_policy.h</a>&quot;</span></div><div class="line"><a name="l00047"></a><span class="lineno">   47</span>&#160;<span class="preprocessor">#include &quot;<a class="code" href="mma__simt_8h.html">cutlass/gemm/warp/mma_simt.h</a>&quot;</span></div><div class="line"><a name="l00048"></a><span class="lineno">   48</span>&#160;<span class="preprocessor">#include &quot;<a class="code" href="default__mma__core_8h.html">cutlass/gemm/threadblock/default_mma_core.h</a>&quot;</span></div><div class="line"><a name="l00049"></a><span class="lineno">   49</span>&#160;</div><div class="line"><a name="l00051"></a><span class="lineno">   51</span>&#160;</div><div class="line"><a name="l00052"></a><span class="lineno">   52</span>&#160;<span class="keyword">namespace </span><a class="code" href="namespacecutlass.html">cutlass</a> {</div><div class="line"><a name="l00053"></a><span class="lineno">   53</span>&#160;<span class="keyword">namespace </span>gemm {</div><div class="line"><a name="l00054"></a><span class="lineno">   54</span>&#160;<span class="keyword">namespace </span>threadblock {</div><div class="line"><a name="l00055"></a><span class="lineno">   55</span>&#160;</div><div class="line"><a name="l00056"></a><span class="lineno"><a class="line" href="namespacecutlass_1_1gemm_1_1threadblock_1_1detail.html">   56</a></span>&#160;<span class="keyword">namespace </span>detail {</div><div class="line"><a name="l00057"></a><span class="lineno">   57</span>&#160;</div><div class="line"><a name="l00058"></a><span class="lineno">   58</span>&#160;<span class="comment">// convert a WarpShape which is the whole tile of elements into warp num threads.</span></div><div class="line"><a name="l00059"></a><span class="lineno">   59</span>&#160;<span class="comment">// The goal is for each thread&#39;s tile of elements to be as square as possible</span></div><div class="line"><a name="l00060"></a><span class="lineno">   
60</span>&#160;<span class="comment">// for performance (4x4 will be faster than 2x8).</span></div><div class="line"><a name="l00061"></a><span class="lineno">   61</span>&#160;<span class="keyword">template</span>&lt;<span class="keyword">typename</span> WarpShape&gt;</div><div class="line"><a name="l00062"></a><span class="lineno"><a class="line" href="namespacecutlass_1_1gemm_1_1threadblock_1_1detail.html#a69a9003a33867ce73f81c37b7414c915">   62</a></span>&#160;<a class="code" href="platform_8h.html#a72f0657181cca64b44eb186b707eb380">constexpr</a> <span class="keywordtype">int</span> <a class="code" href="namespacecutlass_1_1gemm_1_1threadblock_1_1detail.html#a69a9003a33867ce73f81c37b7414c915">simt_get_warp_threads_m</a>() {</div><div class="line"><a name="l00063"></a><span class="lineno">   63</span>&#160;    <span class="keywordflow">return</span> (WarpShape::kM &gt; WarpShape::kN) ? 8 : 4;</div><div class="line"><a name="l00064"></a><span class="lineno">   64</span>&#160;}</div><div class="line"><a name="l00065"></a><span class="lineno">   65</span>&#160;</div><div class="line"><a name="l00067"></a><span class="lineno"><a class="line" href="namespacecutlass_1_1gemm_1_1threadblock_1_1detail.html#a16d673aabb47b0d09f506197bf65e240">   67</a></span>&#160;<a class="code" href="platform_8h.html#a72f0657181cca64b44eb186b707eb380">constexpr</a> <span class="keywordtype">int</span> <a class="code" href="namespacecutlass_1_1gemm_1_1threadblock_1_1detail.html#a16d673aabb47b0d09f506197bf65e240">simt_transpose_padding</a>(<span class="keywordtype">int</span> threads, <span class="keywordtype">int</span> crosswise, <span class="keywordtype">int</span> size_in_bits) {</div><div class="line"><a name="l00068"></a><span class="lineno">   68</span>&#160;  <span class="keywordflow">return</span> (size_in_bits &gt;= 32 ?</div><div class="line"><a name="l00069"></a><span class="lineno">   69</span>&#160;      threads / crosswise / (size_in_bits / 32) :</div><div class="line"><a 
name="l00070"></a><span class="lineno">   70</span>&#160;      threads / crosswise * (32 / size_in_bits)</div><div class="line"><a name="l00071"></a><span class="lineno">   71</span>&#160;  );</div><div class="line"><a name="l00072"></a><span class="lineno">   72</span>&#160;}</div><div class="line"><a name="l00073"></a><span class="lineno">   73</span>&#160;</div><div class="line"><a name="l00074"></a><span class="lineno">   74</span>&#160;}</div><div class="line"><a name="l00075"></a><span class="lineno">   75</span>&#160;</div><div class="line"><a name="l00077"></a><span class="lineno">   77</span>&#160;</div><div class="line"><a name="l00085"></a><span class="lineno">   85</span>&#160;<span class="keyword">template</span> &lt;</div><div class="line"><a name="l00088"></a><span class="lineno">   88</span>&#160;    <span class="keyword">typename</span> Shape_,</div><div class="line"><a name="l00090"></a><span class="lineno">   90</span>&#160;    <span class="keyword">typename</span> WarpShape_,</div><div class="line"><a name="l00092"></a><span class="lineno">   92</span>&#160;    <span class="keyword">typename</span> ElementA_,</div><div class="line"><a name="l00094"></a><span class="lineno">   94</span>&#160;    <span class="keyword">typename</span> ElementB_,</div><div class="line"><a name="l00096"></a><span class="lineno">   96</span>&#160;    <span class="keyword">typename</span> ElementC_,</div><div class="line"><a name="l00098"></a><span class="lineno">   98</span>&#160;    <span class="keyword">typename</span> LayoutC_,</div><div class="line"><a name="l00100"></a><span class="lineno">  100</span>&#160;    <span class="keyword">typename</span> Operator_&gt;</div><div class="line"><a name="l00101"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html">  101</a></span>&#160;<span class="keyword">struct </span><a class="code" 
href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore.html">DefaultMmaCore</a>&lt;Shape_, WarpShape_, <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">GemmShape</a>&lt;1, 1, 1&gt;, ElementA_,</div><div class="line"><a name="l00102"></a><span class="lineno">  102</span>&#160;                      layout::ColumnMajor, ElementB_, <a class="code" href="classcutlass_1_1layout_1_1RowMajor.html">layout::RowMajor</a>,</div><div class="line"><a name="l00103"></a><span class="lineno">  103</span>&#160;                      ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_</div><div class="line"><a name="l00104"></a><span class="lineno">  104</span>&#160;                     &gt; {</div><div class="line"><a name="l00105"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#a43fa0507a4d4bd8ca7df069858f910e6">  105</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#a43fa0507a4d4bd8ca7df069858f910e6">Shape</a> = Shape_;</div><div class="line"><a name="l00106"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#af8139bed1d2a3d23e9d4e1790a058d01">  106</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#af8139bed1d2a3d23e9d4e1790a058d01">WarpShape</a> = WarpShape_;</div><div class="line"><a name="l00107"></a><span class="lineno"><a class="line" 
href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#a88e589a8ab9399b4116b98bbb872d133">  107</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">InstructionShape</a> = <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">GemmShape&lt;1, 1, 1&gt;</a>;</div><div class="line"><a name="l00108"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#af0afef329d873475ac2a4eba05bd943c">  108</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#af0afef329d873475ac2a4eba05bd943c">ElementA</a> = ElementA_;</div><div class="line"><a name="l00109"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#accc6d889c070c36baf7d471d6982ccef">  109</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1layout_1_1ColumnMajor.html">LayoutA</a> = <a class="code" href="classcutlass_1_1layout_1_1ColumnMajor.html">layout::ColumnMajor</a>;</div><div class="line"><a name="l00110"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#aaf221ce787e11cf3edcb49fc2afec46d">  110</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#aaf221ce787e11cf3edcb49fc2afec46d">ElementB</a> = ElementB_;</div><div class="line"><a 
name="l00111"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#a8ac8547ec04936655980a0e5f270815a">  111</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1layout_1_1RowMajor.html">LayoutB</a> = <a class="code" href="classcutlass_1_1layout_1_1RowMajor.html">layout::RowMajor</a>;</div><div class="line"><a name="l00112"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#a562143e6b199064cd539bde597ec3999">  112</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#a562143e6b199064cd539bde597ec3999">ElementC</a> = ElementC_;</div><div class="line"><a name="l00113"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#a926109870af5f4d9120ce5c98bbed2b6">  113</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#a926109870af5f4d9120ce5c98bbed2b6">LayoutC</a> = LayoutC_;</div><div class="line"><a name="l00114"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#a1d91b3f73b2941d84499f28f38b2fcfb">  114</a></span>&#160;  <span class="keyword">using</span> <a class="code" 
href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#a1d91b3f73b2941d84499f28f38b2fcfb">OperatorClass</a> = arch::OpClassSimt;</div><div class="line"><a name="l00115"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#ab949799d5ae5e367142e0c4370241fc6">  115</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> PartitionsK = Shape::kK / WarpShape::kK;</div><div class="line"><a name="l00116"></a><span class="lineno">  116</span>&#160;</div><div class="line"><a name="l00118"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#aa63507fa81a746d9d88363a977018c8b">  118</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#aa63507fa81a746d9d88363a977018c8b">Operator</a> = Operator_;</div><div class="line"><a name="l00119"></a><span class="lineno">  119</span>&#160;</div><div class="line"><a name="l00121"></a><span class="lineno">  121</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">WarpCount</a> = <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">GemmShape</a>&lt;</div><div class="line"><a name="l00122"></a><span class="lineno">  122</span>&#160;    Shape::kM / WarpShape::kM,</div><div class="line"><a name="l00123"></a><span class="lineno">  123</span>&#160;    Shape::kN / WarpShape::kN,</div><div class="line"><a name="l00124"></a><span class="lineno">  124</span>&#160;    PartitionsK</div><div class="line"><a name="l00125"></a><span 
class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#a1d85646ac581fd8e5ae9c597a16aea1d">  125</a></span>&#160;  &gt;;</div><div class="line"><a name="l00126"></a><span class="lineno">  126</span>&#160;</div><div class="line"><a name="l00127"></a><span class="lineno">  127</span>&#160;  <span class="comment">// Divisility requirements</span></div><div class="line"><a name="l00128"></a><span class="lineno">  128</span>&#160;  <a class="code" href="platform_8h.html#adde4c9ea91b753491851361a4198c009">static_assert</a>(</div><div class="line"><a name="l00129"></a><span class="lineno">  129</span>&#160;    !(Shape::kM % WarpShape::kM) &amp;&amp;</div><div class="line"><a name="l00130"></a><span class="lineno">  130</span>&#160;    !(Shape::kN % WarpShape::kN),</div><div class="line"><a name="l00131"></a><span class="lineno">  131</span>&#160;    <span class="stringliteral">&quot;Threadblock-scoped GEMM should be divisible by warp-scoped GEMM size.&quot;</span></div><div class="line"><a name="l00132"></a><span class="lineno">  132</span>&#160;  );</div><div class="line"><a name="l00133"></a><span class="lineno">  133</span>&#160;</div><div class="line"><a name="l00135"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#a2d8ac452ce8d9fa0fe416fd61bff3db4">  135</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kWarpSize = <a class="code" href="structcutlass_1_1gemm_1_1warp_1_1WarpSize.html">warp::WarpSize&lt;arch::OpClassSimt&gt;::value</a>;</div><div class="line"><a name="l00136"></a><span class="lineno">  136</span>&#160;</div><div class="line"><a name="l00138"></a><span class="lineno"><a class="line" 
href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#a42736c96be2a22cf7530a574a2464920">  138</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kThreads = WarpCount::kCount * kWarpSize;</div><div class="line"><a name="l00139"></a><span class="lineno">  139</span>&#160;</div><div class="line"><a name="l00140"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#a1fedb6678cf6a2ba73ad0baa66af319f">  140</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kElementsPerAccess = 1;</div><div class="line"><a name="l00141"></a><span class="lineno">  141</span>&#160;</div><div class="line"><a name="l00142"></a><span class="lineno">  142</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l00143"></a><span class="lineno">  143</span>&#160;  <span class="comment">// Shared memory layouts</span></div><div class="line"><a name="l00144"></a><span class="lineno">  144</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l00145"></a><span class="lineno">  145</span>&#160;</div><div class="line"><a name="l00146"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#a57a9e5da93f0d35a2ddbd33a6aa5ac01">  146</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1layout_1_1ColumnMajor.html">SmemLayoutA</a> = <a class="code" href="classcutlass_1_1layout_1_1ColumnMajor.html">layout::ColumnMajor</a>;</div><div class="line"><a name="l00147"></a><span class="lineno"><a class="line" 
href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#a718759dee390856a1e05dac7ee2eeba8">  147</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1layout_1_1RowMajor.html">SmemLayoutB</a> = <a class="code" href="classcutlass_1_1layout_1_1RowMajor.html">layout::RowMajor</a>;</div><div class="line"><a name="l00148"></a><span class="lineno">  148</span>&#160;</div><div class="line"><a name="l00149"></a><span class="lineno">  149</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l00150"></a><span class="lineno">  150</span>&#160;  <span class="comment">// Iterators to write to shared memory</span></div><div class="line"><a name="l00151"></a><span class="lineno">  151</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l00152"></a><span class="lineno">  152</span>&#160;</div><div class="line"><a name="l00154"></a><span class="lineno">  154</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1transform_1_1PitchLinearStripminedThreadMap.html">IteratorThreadMapA</a> = <a class="code" href="structcutlass_1_1transform_1_1PitchLinearStripminedThreadMap.html">transform::PitchLinearStripminedThreadMap</a>&lt;</div><div class="line"><a name="l00155"></a><span class="lineno">  155</span>&#160;    <a class="code" href="structcutlass_1_1layout_1_1PitchLinearShape.html">layout::PitchLinearShape&lt;Shape::kM, Shape::kK&gt;</a>,</div><div class="line"><a name="l00156"></a><span class="lineno">  156</span>&#160;    kThreads,</div><div class="line"><a name="l00157"></a><span class="lineno">  157</span>&#160;    kElementsPerAccess</div><div class="line"><a name="l00158"></a><span class="lineno"><a class="line" 
href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#a26456fb7a61b7ace3225fc91e9b1f68c">  158</a></span>&#160;  &gt;;</div><div class="line"><a name="l00159"></a><span class="lineno">  159</span>&#160;</div><div class="line"><a name="l00161"></a><span class="lineno">  161</span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileIterator.html">SmemIteratorA</a> = <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileIterator.html">transform::threadblock::RegularTileIterator</a>&lt;</div><div class="line"><a name="l00162"></a><span class="lineno">  162</span>&#160;    <a class="code" href="structcutlass_1_1MatrixShape.html">MatrixShape&lt;Shape::kM, Shape::kK&gt;</a>, </div><div class="line"><a name="l00163"></a><span class="lineno">  163</span>&#160;    <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#af0afef329d873475ac2a4eba05bd943c">ElementA</a>, </div><div class="line"><a name="l00164"></a><span class="lineno">  164</span>&#160;    <a class="code" href="classcutlass_1_1layout_1_1ColumnMajor.html">SmemLayoutA</a>,</div><div class="line"><a name="l00165"></a><span class="lineno">  165</span>&#160;    1,</div><div class="line"><a name="l00166"></a><span class="lineno">  166</span>&#160;    <a class="code" href="structcutlass_1_1transform_1_1PitchLinearStripminedThreadMap.html">IteratorThreadMapA</a></div><div class="line"><a name="l00167"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#aa2db12388e55069e3b0fe2af9954e1a1">  167</a></span>&#160;  &gt;;</div><div class="line"><a name="l00168"></a><span class="lineno">  168</span>&#160;</div><div 
class="line"><a name="l00170"></a><span class="lineno">  170</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1transform_1_1PitchLinearStripminedThreadMap.html">IteratorThreadMapB</a> = <a class="code" href="structcutlass_1_1transform_1_1PitchLinearStripminedThreadMap.html">transform::PitchLinearStripminedThreadMap</a>&lt;</div><div class="line"><a name="l00171"></a><span class="lineno">  171</span>&#160;    <a class="code" href="structcutlass_1_1layout_1_1PitchLinearShape.html">layout::PitchLinearShape&lt;Shape::kN, Shape::kK&gt;</a>,</div><div class="line"><a name="l00172"></a><span class="lineno">  172</span>&#160;    kThreads,</div><div class="line"><a name="l00173"></a><span class="lineno">  173</span>&#160;    kElementsPerAccess</div><div class="line"><a name="l00174"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#a09be4f20512d02f18452dab77298b4da">  174</a></span>&#160;  &gt;;</div><div class="line"><a name="l00175"></a><span class="lineno">  175</span>&#160;</div><div class="line"><a name="l00177"></a><span class="lineno">  177</span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileIterator.html">SmemIteratorB</a> = <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileIterator.html">transform::threadblock::RegularTileIterator</a>&lt;</div><div class="line"><a name="l00178"></a><span class="lineno">  178</span>&#160;    <a class="code" href="structcutlass_1_1MatrixShape.html">MatrixShape&lt;Shape::kK, Shape::kN&gt;</a>, </div><div class="line"><a name="l00179"></a><span class="lineno">  179</span>&#160;    <a class="code" 
href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#aaf221ce787e11cf3edcb49fc2afec46d">ElementB</a>, </div><div class="line"><a name="l00180"></a><span class="lineno">  180</span>&#160;    <a class="code" href="classcutlass_1_1layout_1_1RowMajor.html">SmemLayoutB</a>,</div><div class="line"><a name="l00181"></a><span class="lineno">  181</span>&#160;    0,</div><div class="line"><a name="l00182"></a><span class="lineno">  182</span>&#160;    <a class="code" href="structcutlass_1_1transform_1_1PitchLinearStripminedThreadMap.html">IteratorThreadMapB</a></div><div class="line"><a name="l00183"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#a16900d537540532f4c5efefcc543416b">  183</a></span>&#160;  &gt;;</div><div class="line"><a name="l00184"></a><span class="lineno">  184</span>&#160;</div><div class="line"><a name="l00185"></a><span class="lineno">  185</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l00186"></a><span class="lineno">  186</span>&#160;  <span class="comment">// Warp-level matrix multiply operator</span></div><div class="line"><a name="l00187"></a><span class="lineno">  187</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l00188"></a><span class="lineno">  188</span>&#160;</div><div class="line"><a name="l00189"></a><span class="lineno">  189</span>&#160;  <span class="comment">// Define the warp-level op</span></div><div class="line"><a name="l00190"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#a216700282fe9735796ae0d1f0f79af7a">  190</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span 
class="keywordtype">int</span> WarpNumThreadsM = detail::simt_get_warp_threads_m&lt;WarpShape&gt;();</div><div class="line"><a name="l00191"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#adfcd79b6e1bb378cb44bcb24a415e0f7">  191</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> WarpNumThreadsN = kWarpSize / WarpNumThreadsM;</div><div class="line"><a name="l00192"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#a79b5f6cdeda5d0b3c309d1fcf45d9803">  192</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> ThreadTileM = WarpShape::kM / WarpNumThreadsM;</div><div class="line"><a name="l00193"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#a31d804e96a103165a7c4e7b423f05e26">  193</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> ThreadTileN = WarpShape::kN / WarpNumThreadsN;</div><div class="line"><a name="l00194"></a><span class="lineno">  194</span>&#160;  <a class="code" href="platform_8h.html#adde4c9ea91b753491851361a4198c009">static_assert</a>(!(WarpShape::kM % WarpNumThreadsM) &amp;&amp; !(WarpShape::kN % WarpNumThreadsN),</div><div class="line"><a name="l00195"></a><span class="lineno">  195</span>&#160;      <span class="stringliteral">&quot;WarpShape must be divisible by ThreadTile shape.&quot;</span>);</div><div class="line"><a name="l00196"></a><span class="lineno"><a class="line" 
href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#a1f24faddd5fae8367bad4af8ff2fea08">  196</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> LaneLayout = ThreadTileM &gt; 4 &amp;&amp; ThreadTileN &gt; 4 ? 2 : 1;</div><div class="line"><a name="l00197"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#ae3b7f8dde87eb21afa918922fdf82277">  197</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> numElementsA = 128 / <a class="code" href="structcutlass_1_1sizeof__bits.html">sizeof_bits&lt;ElementA&gt;::value</a>;</div><div class="line"><a name="l00198"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#a849667f66d0bd89addd0abdda5325460">  198</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> numElementsB = 128 / <a class="code" href="structcutlass_1_1sizeof__bits.html">sizeof_bits&lt;ElementB&gt;::value</a>;</div><div class="line"><a name="l00199"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#a1b3217db1d2c0ed2a5f6ec128a2f240d">  199</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> LaneM = <a class="code" href="namespacecutlass.html#a1676e17a7fea0ac40d9d239cbd3ce872">cutlass::const_min</a>(numElementsA, ThreadTileM);</div><div class="line"><a name="l00200"></a><span class="lineno"><a class="line" 
href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#a314973e2cec1559f54505965cf3c7cdc">  200</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> LaneN = <a class="code" href="namespacecutlass.html#a1676e17a7fea0ac40d9d239cbd3ce872">cutlass::const_min</a>(numElementsB, ThreadTileN);</div><div class="line"><a name="l00201"></a><span class="lineno">  201</span>&#160;  <span class="comment">// these should have max of thread tile also</span></div><div class="line"><a name="l00202"></a><span class="lineno">  202</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">LaneMmaShape</a> = <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">cutlass::gemm::GemmShape</a>&lt;</div><div class="line"><a name="l00203"></a><span class="lineno">  203</span>&#160;      LaneM,</div><div class="line"><a name="l00204"></a><span class="lineno">  204</span>&#160;      LaneN,</div><div class="line"><a name="l00205"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#a830c544f4fed1d21e6cb9d9e39b2f55e">  205</a></span>&#160;      1&gt;;</div><div class="line"><a name="l00206"></a><span class="lineno">  206</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1warp_1_1MmaSimtPolicy.html">Policy</a> = <a class="code" href="structcutlass_1_1gemm_1_1warp_1_1MmaSimtPolicy.html">cutlass::gemm::warp::MmaSimtPolicy</a>&lt;</div><div class="line"><a name="l00207"></a><span class="lineno">  207</span>&#160;      <a class="code" href="structcutlass_1_1MatrixShape.html">cutlass::MatrixShape&lt;WarpNumThreadsM, WarpNumThreadsN&gt;</a>,   <span class="comment">// WarpShape</span></div><div class="line"><a 
name="l00208"></a><span class="lineno">  208</span>&#160;      <a class="code" href="structcutlass_1_1layout_1_1RowMajorInterleaved.html">cutlass::layout::RowMajorInterleaved&lt;LaneLayout&gt;</a>,         <span class="comment">// LaneLayout</span></div><div class="line"><a name="l00209"></a><span class="lineno">  209</span>&#160;      <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">LaneMmaShape</a></div><div class="line"><a name="l00210"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#a5e6932a753e9283f543e87b6a4f7d40b">  210</a></span>&#160;  &gt;;</div><div class="line"><a name="l00211"></a><span class="lineno">  211</span>&#160;</div><div class="line"><a name="l00212"></a><span class="lineno">  212</span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1gemm_1_1warp_1_1MmaSimt.html">MmaWarpSimt</a> = <a class="code" href="classcutlass_1_1gemm_1_1warp_1_1MmaSimt.html">cutlass::gemm::warp::MmaSimt</a>&lt;</div><div class="line"><a name="l00213"></a><span class="lineno">  213</span>&#160;    <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#af8139bed1d2a3d23e9d4e1790a058d01">WarpShape</a>,    </div><div class="line"><a name="l00214"></a><span class="lineno">  214</span>&#160;    ElementA,     </div><div class="line"><a name="l00215"></a><span class="lineno">  215</span>&#160;    SmemLayoutA,  </div><div class="line"><a name="l00216"></a><span class="lineno">  216</span>&#160;    ElementB,     </div><div class="line"><a name="l00217"></a><span class="lineno">  217</span>&#160;    SmemLayoutB,  </div><div class="line"><a name="l00218"></a><span class="lineno">  218</span>&#160;    <a class="code" 
href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#a562143e6b199064cd539bde597ec3999">ElementC</a>,     </div><div class="line"><a name="l00219"></a><span class="lineno">  219</span>&#160;    <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#a926109870af5f4d9120ce5c98bbed2b6">LayoutC</a>,      </div><div class="line"><a name="l00220"></a><span class="lineno">  220</span>&#160;    <a class="code" href="structcutlass_1_1gemm_1_1warp_1_1MmaSimtPolicy.html">Policy</a>        </div><div class="line"><a name="l00221"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#accc92ce0cfc6c8e19420557d8b888edb">  221</a></span>&#160;    &gt;;            </div><div class="line"><a name="l00222"></a><span class="lineno">  222</span>&#160;</div><div class="line"><a name="l00224"></a><span class="lineno">  224</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#a05d5677b44fd111bfe6ebcc6fb7d1676">MmaPolicy</a> = <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#a05d5677b44fd111bfe6ebcc6fb7d1676">MmaPolicy</a>&lt;</div><div class="line"><a name="l00225"></a><span class="lineno">  225</span>&#160;    <a class="code" href="classcutlass_1_1gemm_1_1warp_1_1MmaSimt.html">MmaWarpSimt</a>,</div><div class="line"><a name="l00226"></a><span class="lineno">  226</span>&#160;    <a class="code" href="structcutlass_1_1MatrixShape.html">MatrixShape&lt;0, 0&gt;</a>,</div><div class="line"><a name="l00227"></a><span 
class="lineno">  227</span>&#160;    MatrixShape&lt;0, 0&gt;,</div><div class="line"><a name="l00228"></a><span class="lineno">  228</span>&#160;    WarpCount::kK</div><div class="line"><a name="l00229"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#a05d5677b44fd111bfe6ebcc6fb7d1676">  229</a></span>&#160;  &gt;;</div><div class="line"><a name="l00230"></a><span class="lineno">  230</span>&#160;};</div><div class="line"><a name="l00231"></a><span class="lineno">  231</span>&#160;</div><div class="line"><a name="l00233"></a><span class="lineno">  233</span>&#160;</div><div class="line"><a name="l00241"></a><span class="lineno">  241</span>&#160;<span class="keyword">template</span> &lt;</div><div class="line"><a name="l00244"></a><span class="lineno">  244</span>&#160;    <span class="keyword">typename</span> Shape_,</div><div class="line"><a name="l00246"></a><span class="lineno">  246</span>&#160;    <span class="keyword">typename</span> WarpShape_,</div><div class="line"><a name="l00248"></a><span class="lineno">  248</span>&#160;    <span class="keyword">typename</span> ElementA_,</div><div class="line"><a name="l00250"></a><span class="lineno">  250</span>&#160;    <span class="keyword">typename</span> ElementB_,</div><div class="line"><a name="l00252"></a><span class="lineno">  252</span>&#160;    <span class="keyword">typename</span> ElementC_,</div><div class="line"><a name="l00254"></a><span class="lineno">  254</span>&#160;    <span class="keyword">typename</span> LayoutC_,</div><div class="line"><a name="l00256"></a><span class="lineno">  256</span>&#160;    <span class="keyword">typename</span> Operator_&gt;</div><div class="line"><a name="l00257"></a><span class="lineno"><a class="line" 
href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html">  257</a></span>&#160;<span class="keyword">struct </span><a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore.html">DefaultMmaCore</a>&lt;Shape_, WarpShape_, <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">GemmShape</a>&lt;1, 1, 1&gt;, ElementA_,</div><div class="line"><a name="l00258"></a><span class="lineno">  258</span>&#160;                      layout::RowMajor, ElementB_, <a class="code" href="classcutlass_1_1layout_1_1ColumnMajor.html">layout::ColumnMajor</a>,</div><div class="line"><a name="l00259"></a><span class="lineno">  259</span>&#160;                      ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_</div><div class="line"><a name="l00260"></a><span class="lineno">  260</span>&#160;                     &gt; {</div><div class="line"><a name="l00261"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#a6c7b4a920e6d2ab6cf53d51dc410f74f">  261</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#a6c7b4a920e6d2ab6cf53d51dc410f74f">Shape</a> = Shape_;</div><div class="line"><a name="l00262"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#a1bc7903bc348e342702a6f7e314be337">  262</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#a1bc7903bc348e342702a6f7e314be337">WarpShape</a> = WarpShape_;</div><div 
class="line"><a name="l00263"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#af529eb97a1e2d46e301fbaf1dbf4c89c">  263</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">InstructionShape</a> = <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">GemmShape&lt;1, 1, 1&gt;</a>;</div><div class="line"><a name="l00264"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#a2dbfa6ca02fef067e837cb3201e29c52">  264</a></span>&#160;  <span class="keyword">using</span> ElementA = ElementA_;</div><div class="line"><a name="l00265"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#a8c50192463a45aae57d1d4d6f3a75723">  265</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1layout_1_1RowMajor.html">LayoutA</a> = <a class="code" href="classcutlass_1_1layout_1_1RowMajor.html">layout::RowMajor</a>;</div><div class="line"><a name="l00266"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#a6bab5c5d1141ed336fd1bd4fe455e715">  266</a></span>&#160;  <span class="keyword">using</span> ElementB = ElementB_;</div><div class="line"><a name="l00267"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#acd277c26115341aa9dd95f682cd98bed">  267</a></span>&#160;  <span class="keyword">using</span> <a class="code" 
href="classcutlass_1_1layout_1_1ColumnMajor.html">LayoutB</a> = <a class="code" href="classcutlass_1_1layout_1_1ColumnMajor.html">layout::ColumnMajor</a>;</div><div class="line"><a name="l00268"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#a85f9b714299218c989d6bd1b48166758">  268</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#a85f9b714299218c989d6bd1b48166758">ElementC</a> = ElementC_;</div><div class="line"><a name="l00269"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#abbf4045091090bcaf32905afaefb01c5">  269</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#abbf4045091090bcaf32905afaefb01c5">LayoutC</a> = LayoutC_;</div><div class="line"><a name="l00270"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#ab593ff2fb5b33cc946b19aab6b1e64bf">  270</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#ab593ff2fb5b33cc946b19aab6b1e64bf">OperatorClass</a> = arch::OpClassSimt;</div><div class="line"><a name="l00271"></a><span class="lineno"><a class="line" 
href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#ae2344ae8e3350817d9a2275936685165">  271</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> PartitionsK = Shape::kK / WarpShape::kK;</div><div class="line"><a name="l00272"></a><span class="lineno">  272</span>&#160;</div><div class="line"><a name="l00274"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#a812562a7feb033d7c554ab6d86c30388">  274</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#a812562a7feb033d7c554ab6d86c30388">Operator</a> = Operator_;</div><div class="line"><a name="l00275"></a><span class="lineno">  275</span>&#160;</div><div class="line"><a name="l00277"></a><span class="lineno">  277</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">WarpCount</a> = <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">GemmShape</a>&lt;</div><div class="line"><a name="l00278"></a><span class="lineno">  278</span>&#160;    Shape::kM / WarpShape::kM,</div><div class="line"><a name="l00279"></a><span class="lineno">  279</span>&#160;    Shape::kN / WarpShape::kN,</div><div class="line"><a name="l00280"></a><span class="lineno">  280</span>&#160;    PartitionsK</div><div class="line"><a name="l00281"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#a7c561dee13f99e46d436c6dc3755c766">  281</a></span>&#160;  &gt;;</div><div class="line"><a name="l00282"></a><span 
class="lineno">  282</span>&#160;</div><div class="line"><a name="l00283"></a><span class="lineno">  283</span>&#160;  <span class="comment">// Divisibility requirements</span></div><div class="line"><a name="l00284"></a><span class="lineno">  284</span>&#160;  <a class="code" href="platform_8h.html#adde4c9ea91b753491851361a4198c009">static_assert</a>(</div><div class="line"><a name="l00285"></a><span class="lineno">  285</span>&#160;    !(Shape::kM % WarpShape::kM) &amp;&amp;</div><div class="line"><a name="l00286"></a><span class="lineno">  286</span>&#160;    !(Shape::kN % WarpShape::kN),</div><div class="line"><a name="l00287"></a><span class="lineno">  287</span>&#160;    <span class="stringliteral">&quot;Threadblock-scoped GEMM should be divisible by warp-scoped GEMM size.&quot;</span></div><div class="line"><a name="l00288"></a><span class="lineno">  288</span>&#160;  );</div><div class="line"><a name="l00289"></a><span class="lineno">  289</span>&#160;</div><div class="line"><a name="l00291"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#a0523fef53729c2e2431783b546f558fb">  291</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kWarpSize = <a class="code" href="structcutlass_1_1gemm_1_1warp_1_1WarpSize.html">warp::WarpSize&lt;arch::OpClassSimt&gt;::value</a>;</div><div class="line"><a name="l00292"></a><span class="lineno">  292</span>&#160;</div><div class="line"><a name="l00294"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#a2144315db649fe20ba9d42f88aee510b">  294</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kThreads = WarpCount::kCount * 
kWarpSize;</div><div class="line"><a name="l00295"></a><span class="lineno">  295</span>&#160;  </div><div class="line"><a name="l00296"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#ac6cd2c817d78838775074fae95642e5c">  296</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kElementsPerAccess = 1;</div><div class="line"><a name="l00297"></a><span class="lineno">  297</span>&#160;</div><div class="line"><a name="l00298"></a><span class="lineno">  298</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l00299"></a><span class="lineno">  299</span>&#160;  <span class="comment">// Shared memory layouts</span></div><div class="line"><a name="l00300"></a><span class="lineno">  300</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l00301"></a><span class="lineno">  301</span>&#160;</div><div class="line"><a name="l00302"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#acd6c7ff3df9e030a3f439a012c5cc805">  302</a></span>&#160;  <span class="keyword">using</span> SmemLayoutA = <a class="code" href="classcutlass_1_1layout_1_1ColumnMajor.html">layout::ColumnMajor</a>;</div><div class="line"><a name="l00303"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#af705d12303ebff1ba0af00899cc59858">  303</a></span>&#160;  <span class="keyword">using</span> SmemLayoutB = <a class="code" href="classcutlass_1_1layout_1_1RowMajor.html">layout::RowMajor</a>;</div><div class="line"><a name="l00304"></a><span class="lineno">  304</span>&#160;</div><div class="line"><a 
name="l00305"></a><span class="lineno">  305</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l00306"></a><span class="lineno">  306</span>&#160;  <span class="comment">// Iterators to write to shared memory</span></div><div class="line"><a name="l00307"></a><span class="lineno">  307</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l00308"></a><span class="lineno">  308</span>&#160;</div><div class="line"><a name="l00310"></a><span class="lineno">  310</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1transform_1_1PitchLinearStripminedThreadMap.html">IteratorThreadMapA</a> = <a class="code" href="structcutlass_1_1transform_1_1PitchLinearStripminedThreadMap.html">transform::PitchLinearStripminedThreadMap</a>&lt;</div><div class="line"><a name="l00311"></a><span class="lineno">  311</span>&#160;    <a class="code" href="structcutlass_1_1layout_1_1PitchLinearShape.html">layout::PitchLinearShape&lt;Shape::kK, Shape::kM&gt;</a>,</div><div class="line"><a name="l00312"></a><span class="lineno">  312</span>&#160;    kThreads,</div><div class="line"><a name="l00313"></a><span class="lineno">  313</span>&#160;    kElementsPerAccess</div><div class="line"><a name="l00314"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#aa2ba14171d7b2cef99a3db1419ea41fb">  314</a></span>&#160;  &gt;;</div><div class="line"><a name="l00315"></a><span class="lineno">  315</span>&#160;</div><div class="line"><a name="l00317"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#a9ba2e0fae4f8bb596d326fce8e0d24b6">  317</a></span>&#160;  <span class="keyword">using</span> <a class="code" 
href="structcutlass_1_1transform_1_1TransposePitchLinearThreadMapSimt.html">SmemThreadMapA</a> = <a class="code" href="structcutlass_1_1transform_1_1TransposePitchLinearThreadMapSimt.html">transform::TransposePitchLinearThreadMapSimt&lt;IteratorThreadMapA&gt;</a>;</div><div class="line"><a name="l00318"></a><span class="lineno">  318</span>&#160;</div><div class="line"><a name="l00320"></a><span class="lineno">  320</span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileIterator.html">SmemIteratorA</a> = <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileIterator.html">transform::threadblock::RegularTileIterator</a>&lt;</div><div class="line"><a name="l00321"></a><span class="lineno">  321</span>&#160;    MatrixShape&lt;Shape::kM, Shape::kK&gt;, </div><div class="line"><a name="l00322"></a><span class="lineno">  322</span>&#160;    ElementA, </div><div class="line"><a name="l00323"></a><span class="lineno">  323</span>&#160;    SmemLayoutA,</div><div class="line"><a name="l00324"></a><span class="lineno">  324</span>&#160;    1,</div><div class="line"><a name="l00325"></a><span class="lineno">  325</span>&#160;    <a class="code" href="structcutlass_1_1transform_1_1TransposePitchLinearThreadMapSimt.html">SmemThreadMapA</a> <span class="comment">// was IteratorThreadMapA</span></div><div class="line"><a name="l00326"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#a9011a0ee09e3e04873315308a60d7bb1">  326</a></span>&#160;  &gt;;</div><div class="line"><a name="l00327"></a><span class="lineno">  327</span>&#160;</div><div class="line"><a name="l00329"></a><span class="lineno">  329</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1transform_1_1PitchLinearStripminedThreadMap.html">IteratorThreadMapB</a> = 
<a class="code" href="structcutlass_1_1transform_1_1PitchLinearStripminedThreadMap.html">transform::PitchLinearStripminedThreadMap</a>&lt;</div><div class="line"><a name="l00330"></a><span class="lineno">  330</span>&#160;    <a class="code" href="structcutlass_1_1layout_1_1PitchLinearShape.html">layout::PitchLinearShape&lt;Shape::kK, Shape::kN&gt;</a>,</div><div class="line"><a name="l00331"></a><span class="lineno">  331</span>&#160;    kThreads,</div><div class="line"><a name="l00332"></a><span class="lineno">  332</span>&#160;    kElementsPerAccess</div><div class="line"><a name="l00333"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#ae7c43ed31d0702528c90f170bf772293">  333</a></span>&#160;  &gt;;</div><div class="line"><a name="l00334"></a><span class="lineno">  334</span>&#160;</div><div class="line"><a name="l00336"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#aae6130dafe7a06a8cca93d9707c0d5f2">  336</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1transform_1_1TransposePitchLinearThreadMapSimt.html">SmemThreadMapB</a> = <a class="code" href="structcutlass_1_1transform_1_1TransposePitchLinearThreadMapSimt.html">transform::TransposePitchLinearThreadMapSimt&lt;IteratorThreadMapB&gt;</a>;</div><div class="line"><a name="l00337"></a><span class="lineno">  337</span>&#160;</div><div class="line"><a name="l00339"></a><span class="lineno">  339</span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileIterator.html">SmemIteratorB</a> = <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileIterator.html">transform::threadblock::RegularTileIterator</a>&lt;</div><div 
class="line"><a name="l00340"></a><span class="lineno">  340</span>&#160;    MatrixShape&lt;Shape::kK, Shape::kN&gt;, </div><div class="line"><a name="l00341"></a><span class="lineno">  341</span>&#160;    ElementB, </div><div class="line"><a name="l00342"></a><span class="lineno">  342</span>&#160;    SmemLayoutB,</div><div class="line"><a name="l00343"></a><span class="lineno">  343</span>&#160;    0,</div><div class="line"><a name="l00344"></a><span class="lineno">  344</span>&#160;    <a class="code" href="structcutlass_1_1transform_1_1TransposePitchLinearThreadMapSimt.html">SmemThreadMapB</a> <span class="comment">// was IteratorThreadMapA</span></div><div class="line"><a name="l00345"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#ab70161620114c60ba3363cd2056948e4">  345</a></span>&#160;  &gt;;</div><div class="line"><a name="l00346"></a><span class="lineno">  346</span>&#160;</div><div class="line"><a name="l00347"></a><span class="lineno">  347</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l00348"></a><span class="lineno">  348</span>&#160;  <span class="comment">// Warp-level matrix multiply operator</span></div><div class="line"><a name="l00349"></a><span class="lineno">  349</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l00350"></a><span class="lineno">  350</span>&#160;</div><div class="line"><a name="l00351"></a><span class="lineno">  351</span>&#160;  <span class="comment">// Define the warp-level op</span></div><div class="line"><a name="l00352"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#adb4ca21db8569aa3adf827fb6cb699d7">  352</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span 
class="keywordtype">int</span> WarpNumThreadsM = detail::simt_get_warp_threads_m&lt;WarpShape&gt;();</div><div class="line"><a name="l00353"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#a07ad995e1c5fe9e936f8a0d0cb36943f">  353</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> WarpNumThreadsN = kWarpSize / WarpNumThreadsM;</div><div class="line"><a name="l00354"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#aeaad0d41c32682cb7ea888cb5a692cde">  354</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> ThreadTileM = WarpShape::kM / WarpNumThreadsM;</div><div class="line"><a name="l00355"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#af6822fb4c033f140c64ca2a2a9669e08">  355</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> ThreadTileN = WarpShape::kN / WarpNumThreadsN;</div><div class="line"><a name="l00356"></a><span class="lineno">  356</span>&#160;  <a class="code" href="platform_8h.html#adde4c9ea91b753491851361a4198c009">static_assert</a>(!(WarpShape::kM % WarpNumThreadsM) &amp;&amp; !(WarpShape::kN % WarpNumThreadsN),</div><div class="line"><a name="l00357"></a><span class="lineno">  357</span>&#160;      <span class="stringliteral">&quot;WarpShape must be divisible by ThreadTile shape.&quot;</span>);</div><div class="line"><a name="l00358"></a><span class="lineno"><a class="line" 
href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#a48f19989a6c2158f65b05003ecc9c677">  358</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> LaneLayout = ThreadTileM &gt; 4 &amp;&amp; ThreadTileN &gt; 4 ? 2 : 1;</div><div class="line"><a name="l00359"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#a278fba6345a2bc229581fda6087cf13b">  359</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> numElementsA = 128 / <a class="code" href="structcutlass_1_1sizeof__bits.html">sizeof_bits&lt;ElementA&gt;::value</a>;</div><div class="line"><a name="l00360"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#a530d1ff17f4ba7a12a4a237c08041467">  360</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> numElementsB = 128 / <a class="code" href="structcutlass_1_1sizeof__bits.html">sizeof_bits&lt;ElementB&gt;::value</a>;</div><div class="line"><a name="l00361"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#abc08157c25c1aa3db1309114325b5894">  361</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> LaneM = <a class="code" href="namespacecutlass.html#a1676e17a7fea0ac40d9d239cbd3ce872">cutlass::const_min</a>(numElementsA, ThreadTileM);</div><div class="line"><a name="l00362"></a><span class="lineno"><a class="line" 
href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#a7e692bab9288ff9d3fdd0fa20028adcc">  362</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> LaneN = <a class="code" href="namespacecutlass.html#a1676e17a7fea0ac40d9d239cbd3ce872">cutlass::const_min</a>(numElementsB, ThreadTileN);</div><div class="line"><a name="l00363"></a><span class="lineno">  363</span>&#160;</div><div class="line"><a name="l00364"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#aeeab30cf98a08762b8f2d25db8e3dee2">  364</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kPaddingM = <a class="code" href="namespacecutlass_1_1gemm_1_1threadblock_1_1detail.html#a16d673aabb47b0d09f506197bf65e240">detail::simt_transpose_padding</a>(kWarpSize, Shape::kK, <a class="code" href="structcutlass_1_1sizeof__bits.html">sizeof_bits&lt;ElementA&gt;::value</a>);</div><div class="line"><a name="l00365"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#a08b6dcc32e0b9f2390f2663573bdf73b">  365</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kPaddingN = <a class="code" href="namespacecutlass_1_1gemm_1_1threadblock_1_1detail.html#a16d673aabb47b0d09f506197bf65e240">detail::simt_transpose_padding</a>(kWarpSize, Shape::kK, <a class="code" href="structcutlass_1_1sizeof__bits.html">sizeof_bits&lt;ElementB&gt;::value</a>);</div><div class="line"><a name="l00366"></a><span class="lineno">  366</span>&#160;</div><div class="line"><a name="l00367"></a><span 
class="lineno">  367</span>&#160;  <span class="comment">// these should have max of thread tile also</span></div><div class="line"><a name="l00368"></a><span class="lineno">  368</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">LaneMmaShape</a> = <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">cutlass::gemm::GemmShape</a>&lt;</div><div class="line"><a name="l00369"></a><span class="lineno">  369</span>&#160;      LaneM,</div><div class="line"><a name="l00370"></a><span class="lineno">  370</span>&#160;      LaneN,</div><div class="line"><a name="l00371"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#a70bd709536f3452656041c40f0732fc0">  371</a></span>&#160;      1&gt;;</div><div class="line"><a name="l00372"></a><span class="lineno">  372</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1warp_1_1MmaSimtPolicy.html">Policy</a> = <a class="code" href="structcutlass_1_1gemm_1_1warp_1_1MmaSimtPolicy.html">cutlass::gemm::warp::MmaSimtPolicy</a>&lt;</div><div class="line"><a name="l00373"></a><span class="lineno">  373</span>&#160;      <a class="code" href="structcutlass_1_1MatrixShape.html">cutlass::MatrixShape&lt;WarpNumThreadsM, WarpNumThreadsN&gt;</a>,   <span class="comment">// WarpShape</span></div><div class="line"><a name="l00374"></a><span class="lineno">  374</span>&#160;      <a class="code" href="structcutlass_1_1layout_1_1RowMajorInterleaved.html">cutlass::layout::RowMajorInterleaved&lt;LaneLayout&gt;</a>,         <span class="comment">// LaneLayout</span></div><div class="line"><a name="l00375"></a><span class="lineno">  375</span>&#160;      <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">LaneMmaShape</a></div><div class="line"><a name="l00376"></a><span class="lineno"><a class="line" 
href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#a83650df8cb2ab42b64c369ec37b92871">  376</a></span>&#160;  &gt;;</div><div class="line"><a name="l00377"></a><span class="lineno">  377</span>&#160;</div><div class="line"><a name="l00378"></a><span class="lineno">  378</span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1gemm_1_1warp_1_1MmaSimt.html">MmaWarpSimt</a> = <a class="code" href="classcutlass_1_1gemm_1_1warp_1_1MmaSimt.html">cutlass::gemm::warp::MmaSimt</a>&lt;</div><div class="line"><a name="l00379"></a><span class="lineno">  379</span>&#160;      <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#a1bc7903bc348e342702a6f7e314be337">WarpShape</a>,      </div><div class="line"><a name="l00380"></a><span class="lineno">  380</span>&#160;      ElementA,       </div><div class="line"><a name="l00381"></a><span class="lineno">  381</span>&#160;      SmemLayoutA,    </div><div class="line"><a name="l00382"></a><span class="lineno">  382</span>&#160;      ElementB,       </div><div class="line"><a name="l00383"></a><span class="lineno">  383</span>&#160;      SmemLayoutB,    </div><div class="line"><a name="l00384"></a><span class="lineno">  384</span>&#160;      <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#a85f9b714299218c989d6bd1b48166758">ElementC</a>,       </div><div class="line"><a name="l00385"></a><span class="lineno">  385</span>&#160;      <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#abbf4045091090bcaf32905afaefb01c5">LayoutC</a>,        </div><div class="line"><a name="l00386"></a><span class="lineno">  
386</span>&#160;      <a class="code" href="structcutlass_1_1gemm_1_1warp_1_1MmaSimtPolicy.html">Policy</a>          </div><div class="line"><a name="l00387"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#ad76d08483cf17fb0bbd2c5670a1a1613">  387</a></span>&#160;  &gt;;</div><div class="line"><a name="l00388"></a><span class="lineno">  388</span>&#160;</div><div class="line"><a name="l00390"></a><span class="lineno">  390</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#a19db74df10235f4d5e36518bac33b4c6">MmaPolicy</a> = <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#a19db74df10235f4d5e36518bac33b4c6">MmaPolicy</a>&lt;</div><div class="line"><a name="l00391"></a><span class="lineno">  391</span>&#160;    <a class="code" href="classcutlass_1_1gemm_1_1warp_1_1MmaSimt.html">MmaWarpSimt</a>,</div><div class="line"><a name="l00392"></a><span class="lineno">  392</span>&#160;    <a class="code" href="structcutlass_1_1MatrixShape.html">MatrixShape&lt;kPaddingN, 0&gt;</a>,    <span class="comment">// skew for A matrix to avoid SMEM bank conflicts</span></div><div class="line"><a name="l00393"></a><span class="lineno">  393</span>&#160;    <a class="code" href="structcutlass_1_1MatrixShape.html">MatrixShape&lt;0, kPaddingN&gt;</a>,    <span class="comment">// skew for B matrix to avoid SMEM bank conflicts</span></div><div class="line"><a name="l00394"></a><span class="lineno">  394</span>&#160;    WarpCount::kK</div><div class="line"><a name="l00395"></a><span class="lineno"><a class="line" 
href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#a19db74df10235f4d5e36518bac33b4c6">  395</a></span>&#160;  &gt;;</div><div class="line"><a name="l00396"></a><span class="lineno">  396</span>&#160;};</div><div class="line"><a name="l00397"></a><span class="lineno">  397</span>&#160;</div><div class="line"><a name="l00399"></a><span class="lineno">  399</span>&#160;</div><div class="line"><a name="l00407"></a><span class="lineno">  407</span>&#160;<span class="keyword">template</span> &lt;</div><div class="line"><a name="l00410"></a><span class="lineno">  410</span>&#160;    <span class="keyword">typename</span> Shape_,</div><div class="line"><a name="l00412"></a><span class="lineno">  412</span>&#160;    <span class="keyword">typename</span> WarpShape_,</div><div class="line"><a name="l00414"></a><span class="lineno">  414</span>&#160;    <span class="keyword">typename</span> ElementA_,</div><div class="line"><a name="l00416"></a><span class="lineno">  416</span>&#160;    <span class="keyword">typename</span> ElementB_,</div><div class="line"><a name="l00418"></a><span class="lineno">  418</span>&#160;    <span class="keyword">typename</span> ElementC_,</div><div class="line"><a name="l00420"></a><span class="lineno">  420</span>&#160;    <span class="keyword">typename</span> LayoutC_,</div><div class="line"><a name="l00422"></a><span class="lineno">  422</span>&#160;    <span class="keyword">typename</span> Operator_&gt;</div><div class="line"><a name="l00423"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html">  423</a></span>&#160;<span class="keyword">struct </span><a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore.html">DefaultMmaCore</a>&lt;Shape_, WarpShape_, <a class="code" 
href="structcutlass_1_1gemm_1_1GemmShape.html">GemmShape</a>&lt;1, 1, 1&gt;, ElementA_,</div><div class="line"><a name="l00424"></a><span class="lineno">  424</span>&#160;                      layout::RowMajor, ElementB_, <a class="code" href="classcutlass_1_1layout_1_1RowMajor.html">layout::RowMajor</a>, ElementC_,</div><div class="line"><a name="l00425"></a><span class="lineno">  425</span>&#160;                      LayoutC_, arch::OpClassSimt, 2, Operator_</div><div class="line"><a name="l00426"></a><span class="lineno">  426</span>&#160;                     &gt; {</div><div class="line"><a name="l00427"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#ac514eda9ab5d8a522bf444f9f415d361">  427</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#ac514eda9ab5d8a522bf444f9f415d361">Shape</a> = Shape_;</div><div class="line"><a name="l00428"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#aca4a8b44fb78de382813bd3bda11f5ce">  428</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#aca4a8b44fb78de382813bd3bda11f5ce">WarpShape</a> = WarpShape_;</div><div class="line"><a name="l00429"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#acd6237299856344061f05c8100b452cc">  429</a></span>&#160;  <span class="keyword">using</span> <a class="code" 
href="structcutlass_1_1gemm_1_1GemmShape.html">InstructionShape</a> = <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">GemmShape&lt;1, 1, 1&gt;</a>;</div><div class="line"><a name="l00430"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#aed2fa0b483ca496fa3becd970e07539d">  430</a></span>&#160;  <span class="keyword">using</span> ElementA = ElementA_;</div><div class="line"><a name="l00431"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#a6c983b87a5a65a86b4d6360f6a679c2a">  431</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1layout_1_1RowMajor.html">LayoutA</a> = <a class="code" href="classcutlass_1_1layout_1_1RowMajor.html">layout::RowMajor</a>;</div><div class="line"><a name="l00432"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#acc47c2e63edb180761e6c9d0a89d6545">  432</a></span>&#160;  <span class="keyword">using</span> ElementB = ElementB_;</div><div class="line"><a name="l00433"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#ac2c4bacb4c37e02bd29db3c5e76232ff">  433</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1layout_1_1RowMajor.html">LayoutB</a> = <a class="code" href="classcutlass_1_1layout_1_1RowMajor.html">layout::RowMajor</a>;</div><div class="line"><a name="l00434"></a><span class="lineno"><a class="line" 
href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#aea4174e3f2e32dcd170dea50d5675369">  434</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#aea4174e3f2e32dcd170dea50d5675369">ElementC</a> = ElementC_;</div><div class="line"><a name="l00435"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#a6a1ad914c597f2ced6ddb356516a1413">  435</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#a6a1ad914c597f2ced6ddb356516a1413">LayoutC</a> = LayoutC_;</div><div class="line"><a name="l00436"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#a19213bcaeaf5e7746176526f7c57de32">  436</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#a19213bcaeaf5e7746176526f7c57de32">OperatorClass</a> = arch::OpClassSimt;</div><div class="line"><a name="l00437"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#a3f408abe089b8476d19f809c976992d7">  437</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> PartitionsK = Shape::kK / WarpShape::kK;</div><div class="line"><a 
name="l00438"></a><span class="lineno">  438</span>&#160;</div><div class="line"><a name="l00440"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#a08ebcc80c20f997c2e9385eeb8004b26">  440</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#a08ebcc80c20f997c2e9385eeb8004b26">Operator</a> = Operator_;</div><div class="line"><a name="l00441"></a><span class="lineno">  441</span>&#160;</div><div class="line"><a name="l00443"></a><span class="lineno">  443</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">WarpCount</a> = <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">GemmShape</a>&lt;</div><div class="line"><a name="l00444"></a><span class="lineno">  444</span>&#160;    Shape::kM / WarpShape::kM,</div><div class="line"><a name="l00445"></a><span class="lineno">  445</span>&#160;    Shape::kN / WarpShape::kN,</div><div class="line"><a name="l00446"></a><span class="lineno">  446</span>&#160;    PartitionsK</div><div class="line"><a name="l00447"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#a7e17356aba016255ad9e5ee970e5cd8d">  447</a></span>&#160;  &gt;;</div><div class="line"><a name="l00448"></a><span class="lineno">  448</span>&#160;</div><div class="line"><a name="l00449"></a><span class="lineno">  449</span>&#160;  <span class="comment">// Divisibility requirements</span></div><div class="line"><a name="l00450"></a><span class="lineno">  450</span>&#160;  <a class="code" href="platform_8h.html#adde4c9ea91b753491851361a4198c009">static_assert</a>(</div><div class="line"><a 
name="l00451"></a><span class="lineno">  451</span>&#160;    !(Shape::kM % WarpShape::kM) &amp;&amp;</div><div class="line"><a name="l00452"></a><span class="lineno">  452</span>&#160;    !(Shape::kN % WarpShape::kN),</div><div class="line"><a name="l00453"></a><span class="lineno">  453</span>&#160;    <span class="stringliteral">&quot;Threadblock-scoped GEMM should be divisible by warp-scoped GEMM size.&quot;</span></div><div class="line"><a name="l00454"></a><span class="lineno">  454</span>&#160;  );</div><div class="line"><a name="l00455"></a><span class="lineno">  455</span>&#160;</div><div class="line"><a name="l00457"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#a018a1dcfae2420f8df12803b60c12563">  457</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kWarpSize = <a class="code" href="structcutlass_1_1gemm_1_1warp_1_1WarpSize.html">warp::WarpSize&lt;arch::OpClassSimt&gt;::value</a>;</div><div class="line"><a name="l00458"></a><span class="lineno">  458</span>&#160;</div><div class="line"><a name="l00460"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#a08416c46082a019721f129ac878ecce3">  460</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kThreads = WarpCount::kCount * kWarpSize;</div><div class="line"><a name="l00461"></a><span class="lineno">  461</span>&#160;</div><div class="line"><a name="l00462"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#a36805c4cedb5ba75337ec6454baddb25">  462</a></span>&#160;  <span 
class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kElementsPerAccess = 1;</div><div class="line"><a name="l00463"></a><span class="lineno">  463</span>&#160;</div><div class="line"><a name="l00464"></a><span class="lineno">  464</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l00465"></a><span class="lineno">  465</span>&#160;  <span class="comment">// Shared memory layouts</span></div><div class="line"><a name="l00466"></a><span class="lineno">  466</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l00467"></a><span class="lineno">  467</span>&#160;</div><div class="line"><a name="l00468"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#a5317ee97ce276f45ac7cecce2f82684a">  468</a></span>&#160;  <span class="keyword">using</span> SmemLayoutA = <a class="code" href="classcutlass_1_1layout_1_1ColumnMajor.html">layout::ColumnMajor</a>;</div><div class="line"><a name="l00469"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#a1699470cb8d19273758cae02c38c68ce">  469</a></span>&#160;  <span class="keyword">using</span> SmemLayoutB = <a class="code" href="classcutlass_1_1layout_1_1RowMajor.html">layout::RowMajor</a>;</div><div class="line"><a name="l00470"></a><span class="lineno">  470</span>&#160;</div><div class="line"><a name="l00471"></a><span class="lineno">  471</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l00472"></a><span class="lineno">  472</span>&#160;  <span class="comment">// Iterators to write to shared memory</span></div><div class="line"><a name="l00473"></a><span class="lineno">  473</span>&#160;  <span class="comment">//</span></div><div class="line"><a 
name="l00474"></a><span class="lineno">  474</span>&#160;</div><div class="line"><a name="l00476"></a><span class="lineno">  476</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1transform_1_1PitchLinearStripminedThreadMap.html">IteratorThreadMapA</a> = <a class="code" href="structcutlass_1_1transform_1_1PitchLinearStripminedThreadMap.html">transform::PitchLinearStripminedThreadMap</a>&lt;</div><div class="line"><a name="l00477"></a><span class="lineno">  477</span>&#160;    layout::PitchLinearShape&lt;Shape::kK, Shape::kM&gt;,</div><div class="line"><a name="l00478"></a><span class="lineno">  478</span>&#160;    kThreads,</div><div class="line"><a name="l00479"></a><span class="lineno">  479</span>&#160;    kElementsPerAccess</div><div class="line"><a name="l00480"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#a269432cb8385f4cdc6783d122990410f">  480</a></span>&#160;  &gt;;</div><div class="line"><a name="l00481"></a><span class="lineno">  481</span>&#160;</div><div class="line"><a name="l00483"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#a625b9d82585cf4baa3fb5e4ed16dd466">  483</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1transform_1_1TransposePitchLinearThreadMapSimt.html">SmemThreadMapA</a> = <a class="code" href="structcutlass_1_1transform_1_1TransposePitchLinearThreadMapSimt.html">transform::TransposePitchLinearThreadMapSimt&lt;IteratorThreadMapA&gt;</a>;</div><div class="line"><a name="l00484"></a><span class="lineno">  484</span>&#160;</div><div class="line"><a name="l00486"></a><span class="lineno">  486</span>&#160;  <span class="keyword">using</span> <a class="code" 
href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileIterator.html">SmemIteratorA</a> = <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileIterator.html">transform::threadblock::RegularTileIterator</a>&lt;</div><div class="line"><a name="l00487"></a><span class="lineno">  487</span>&#160;    MatrixShape&lt;Shape::kM, Shape::kK&gt;, </div><div class="line"><a name="l00488"></a><span class="lineno">  488</span>&#160;    ElementA, </div><div class="line"><a name="l00489"></a><span class="lineno">  489</span>&#160;    SmemLayoutA,</div><div class="line"><a name="l00490"></a><span class="lineno">  490</span>&#160;    1,</div><div class="line"><a name="l00491"></a><span class="lineno">  491</span>&#160;    <a class="code" href="structcutlass_1_1transform_1_1TransposePitchLinearThreadMapSimt.html">SmemThreadMapA</a></div><div class="line"><a name="l00492"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#a9d88c7fe5a44bec0335b884abc9f7df8">  492</a></span>&#160;  &gt;;</div><div class="line"><a name="l00493"></a><span class="lineno">  493</span>&#160;</div><div class="line"><a name="l00495"></a><span class="lineno">  495</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1transform_1_1PitchLinearStripminedThreadMap.html">IteratorThreadMapB</a> = <a class="code" href="structcutlass_1_1transform_1_1PitchLinearStripminedThreadMap.html">transform::PitchLinearStripminedThreadMap</a>&lt;</div><div class="line"><a name="l00496"></a><span class="lineno">  496</span>&#160;    layout::PitchLinearShape&lt;Shape::kN, Shape::kK&gt;,</div><div class="line"><a name="l00497"></a><span class="lineno">  497</span>&#160;    kThreads,</div><div class="line"><a name="l00498"></a><span class="lineno">  498</span>&#160;    kElementsPerAccess</div><div class="line"><a name="l00499"></a><span 
class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#ad6be000724ac447ecd66dd0720f05162">  499</a></span>&#160;  &gt;;</div><div class="line"><a name="l00500"></a><span class="lineno">  500</span>&#160;</div><div class="line"><a name="l00502"></a><span class="lineno">  502</span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileIterator.html">SmemIteratorB</a> = <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileIterator.html">transform::threadblock::RegularTileIterator</a>&lt;</div><div class="line"><a name="l00503"></a><span class="lineno">  503</span>&#160;    MatrixShape&lt;Shape::kK, Shape::kN&gt;, </div><div class="line"><a name="l00504"></a><span class="lineno">  504</span>&#160;    ElementB, </div><div class="line"><a name="l00505"></a><span class="lineno">  505</span>&#160;    SmemLayoutB,</div><div class="line"><a name="l00506"></a><span class="lineno">  506</span>&#160;    0,</div><div class="line"><a name="l00507"></a><span class="lineno">  507</span>&#160;    <a class="code" href="structcutlass_1_1transform_1_1PitchLinearStripminedThreadMap.html">IteratorThreadMapB</a></div><div class="line"><a name="l00508"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#a11d653866788aab57d71df476834161d">  508</a></span>&#160;  &gt;;</div><div class="line"><a name="l00509"></a><span class="lineno">  509</span>&#160;</div><div class="line"><a name="l00510"></a><span class="lineno">  510</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l00511"></a><span class="lineno">  511</span>&#160;  <span class="comment">// Warp-level matrix multiply operator</span></div><div class="line"><a 
name="l00512"></a><span class="lineno">  512</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l00513"></a><span class="lineno">  513</span>&#160;</div><div class="line"><a name="l00514"></a><span class="lineno">  514</span>&#160;  <span class="comment">// Define the warp-level op</span></div><div class="line"><a name="l00515"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#a6dc8f07ec5732bf736ce05d48ebf3c56">  515</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> WarpNumThreadsM = detail::simt_get_warp_threads_m&lt;WarpShape&gt;();</div><div class="line"><a name="l00516"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#a0ee473c7b36abf5ab3abfe7598c4dbdc">  516</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> WarpNumThreadsN = kWarpSize / WarpNumThreadsM;</div><div class="line"><a name="l00517"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#a3207284867d7865722c68f7458e0f931">  517</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> ThreadTileM = WarpShape::kM / WarpNumThreadsM;</div><div class="line"><a name="l00518"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#adb7556874a35fface20ce9cf900be38a">  518</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> 
<span class="keywordtype">int</span> ThreadTileN = WarpShape::kN / WarpNumThreadsN;</div><div class="line"><a name="l00519"></a><span class="lineno">  519</span>&#160;  <a class="code" href="platform_8h.html#adde4c9ea91b753491851361a4198c009">static_assert</a>(!(WarpShape::kM % WarpNumThreadsM) &amp;&amp; !(WarpShape::kN % WarpNumThreadsN),</div><div class="line"><a name="l00520"></a><span class="lineno">  520</span>&#160;      <span class="stringliteral">&quot;WarpShape must be divisible by ThreadTile shape.&quot;</span>);</div><div class="line"><a name="l00521"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#a0324e9579a1d801621325cd0c82b2d99">  521</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> LaneLayout = ThreadTileM &gt; 4 &amp;&amp; ThreadTileN &gt; 4 ? 2 : 1;</div><div class="line"><a name="l00522"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#ae2f78a55a6e6f699419cb8f64acc3628">  522</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> numElementsA = 128 / <a class="code" href="structcutlass_1_1sizeof__bits.html">sizeof_bits&lt;ElementA&gt;::value</a>;</div><div class="line"><a name="l00523"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#aee55fd5f0201a4b98aaf07c49fb916fc">  523</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> numElementsB = 128 / <a class="code" 
href="structcutlass_1_1sizeof__bits.html">sizeof_bits&lt;ElementB&gt;::value</a>;</div><div class="line"><a name="l00524"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#a9db6f5e69a9d1ded6458b201fe43a006">  524</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> LaneM = <a class="code" href="namespacecutlass.html#a1676e17a7fea0ac40d9d239cbd3ce872">cutlass::const_min</a>(numElementsA, ThreadTileM);</div><div class="line"><a name="l00525"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#ab929adb91ea0dcf95dfc1081a82c6520">  525</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> LaneN = <a class="code" href="namespacecutlass.html#a1676e17a7fea0ac40d9d239cbd3ce872">cutlass::const_min</a>(numElementsB, ThreadTileN);</div><div class="line"><a name="l00526"></a><span class="lineno">  526</span>&#160;</div><div class="line"><a name="l00527"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#abfbcaec3b5165493373ee0e72b6cf975">  527</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kPaddingM = <a class="code" href="namespacecutlass_1_1gemm_1_1threadblock_1_1detail.html#a16d673aabb47b0d09f506197bf65e240">detail::simt_transpose_padding</a>(kWarpSize, Shape::kK, <a class="code" href="structcutlass_1_1sizeof__bits.html">sizeof_bits&lt;ElementA&gt;::value</a>);</div><div class="line"><a name="l00528"></a><span class="lineno">  528</span>&#160;</div><div class="line"><a 
name="l00529"></a><span class="lineno">  529</span>&#160;  <span class="comment">// these should have max of thread tile also</span></div><div class="line"><a name="l00530"></a><span class="lineno">  530</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">LaneMmaShape</a> = <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">cutlass::gemm::GemmShape</a>&lt;</div><div class="line"><a name="l00531"></a><span class="lineno">  531</span>&#160;      LaneM,</div><div class="line"><a name="l00532"></a><span class="lineno">  532</span>&#160;      LaneN,</div><div class="line"><a name="l00533"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#a5bc6621f63ea24c3bc98c297b8d7603f">  533</a></span>&#160;      1&gt;;</div><div class="line"><a name="l00534"></a><span class="lineno">  534</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1warp_1_1MmaSimtPolicy.html">Policy</a> = <a class="code" href="structcutlass_1_1gemm_1_1warp_1_1MmaSimtPolicy.html">cutlass::gemm::warp::MmaSimtPolicy</a>&lt;</div><div class="line"><a name="l00535"></a><span class="lineno">  535</span>&#160;      <a class="code" href="structcutlass_1_1MatrixShape.html">cutlass::MatrixShape&lt;WarpNumThreadsM, WarpNumThreadsN&gt;</a>,   <span class="comment">// WarpShape</span></div><div class="line"><a name="l00536"></a><span class="lineno">  536</span>&#160;      <a class="code" href="structcutlass_1_1layout_1_1RowMajorInterleaved.html">cutlass::layout::RowMajorInterleaved&lt;LaneLayout&gt;</a>,         <span class="comment">// LaneLayout</span></div><div class="line"><a name="l00537"></a><span class="lineno">  537</span>&#160;      <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">LaneMmaShape</a></div><div class="line"><a name="l00538"></a><span 
class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#a0eebd627f3649fab55d71ea147f6ec82">  538</a></span>&#160;  &gt;;</div><div class="line"><a name="l00539"></a><span class="lineno">  539</span>&#160;</div><div class="line"><a name="l00540"></a><span class="lineno">  540</span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1gemm_1_1warp_1_1MmaSimt.html">MmaWarpSimt</a> = <a class="code" href="classcutlass_1_1gemm_1_1warp_1_1MmaSimt.html">cutlass::gemm::warp::MmaSimt</a>&lt;</div><div class="line"><a name="l00541"></a><span class="lineno">  541</span>&#160;      <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#aca4a8b44fb78de382813bd3bda11f5ce">WarpShape</a>,    </div><div class="line"><a name="l00542"></a><span class="lineno">  542</span>&#160;      ElementA,     </div><div class="line"><a name="l00543"></a><span class="lineno">  543</span>&#160;      SmemLayoutA,  </div><div class="line"><a name="l00544"></a><span class="lineno">  544</span>&#160;      ElementB,     </div><div class="line"><a name="l00545"></a><span class="lineno">  545</span>&#160;      SmemLayoutB,  </div><div class="line"><a name="l00546"></a><span class="lineno">  546</span>&#160;      <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#aea4174e3f2e32dcd170dea50d5675369">ElementC</a>,     </div><div class="line"><a name="l00547"></a><span class="lineno">  547</span>&#160;      <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#a6a1ad914c597f2ced6ddb356516a1413">LayoutC</a>,      </div><div class="line"><a name="l00548"></a><span 
class="lineno">  548</span>&#160;      <a class="code" href="structcutlass_1_1gemm_1_1warp_1_1MmaSimtPolicy.html">Policy</a>        </div><div class="line"><a name="l00549"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#a72f4f59aa197a618e56037ff006482d2">  549</a></span>&#160;  &gt;;</div><div class="line"><a name="l00550"></a><span class="lineno">  550</span>&#160;</div><div class="line"><a name="l00552"></a><span class="lineno">  552</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#af2c71eb39f54a898753b9ff25e6f3072">MmaPolicy</a> = <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#af2c71eb39f54a898753b9ff25e6f3072">MmaPolicy</a>&lt;</div><div class="line"><a name="l00553"></a><span class="lineno">  553</span>&#160;    <a class="code" href="classcutlass_1_1gemm_1_1warp_1_1MmaSimt.html">MmaWarpSimt</a>,</div><div class="line"><a name="l00554"></a><span class="lineno">  554</span>&#160;    <a class="code" href="structcutlass_1_1MatrixShape.html">MatrixShape&lt;kPaddingM, 0&gt;</a>,    <span class="comment">// skew for A matrix to avoid SMEM bank conflicts</span></div><div class="line"><a name="l00555"></a><span class="lineno">  555</span>&#160;    <a class="code" href="structcutlass_1_1MatrixShape.html">MatrixShape&lt;0, 0&gt;</a>,</div><div class="line"><a name="l00556"></a><span class="lineno">  556</span>&#160;    WarpCount::kK</div><div class="line"><a name="l00557"></a><span class="lineno"><a class="line" 
href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#af2c71eb39f54a898753b9ff25e6f3072">  557</a></span>&#160;  &gt;;</div><div class="line"><a name="l00558"></a><span class="lineno">  558</span>&#160;};</div><div class="line"><a name="l00559"></a><span class="lineno">  559</span>&#160;</div><div class="line"><a name="l00561"></a><span class="lineno">  561</span>&#160;</div><div class="line"><a name="l00569"></a><span class="lineno">  569</span>&#160;<span class="keyword">template</span> &lt;</div><div class="line"><a name="l00572"></a><span class="lineno">  572</span>&#160;    <span class="keyword">typename</span> Shape_,</div><div class="line"><a name="l00574"></a><span class="lineno">  574</span>&#160;    <span class="keyword">typename</span> WarpShape_,</div><div class="line"><a name="l00576"></a><span class="lineno">  576</span>&#160;    <span class="keyword">typename</span> ElementA_,</div><div class="line"><a name="l00578"></a><span class="lineno">  578</span>&#160;    <span class="keyword">typename</span> ElementB_,</div><div class="line"><a name="l00580"></a><span class="lineno">  580</span>&#160;    <span class="keyword">typename</span> ElementC_,</div><div class="line"><a name="l00582"></a><span class="lineno">  582</span>&#160;    <span class="keyword">typename</span> LayoutC_,</div><div class="line"><a name="l00584"></a><span class="lineno">  584</span>&#160;    <span class="keyword">typename</span> Operator_&gt;</div><div class="line"><a name="l00585"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html">  585</a></span>&#160;<span class="keyword">struct </span><a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore.html">DefaultMmaCore</a>&lt;Shape_, WarpShape_, <a class="code" 
href="structcutlass_1_1gemm_1_1GemmShape.html">GemmShape</a>&lt;1, 1, 1&gt;, ElementA_,</div><div class="line"><a name="l00586"></a><span class="lineno">  586</span>&#160;                      layout::ColumnMajor, ElementB_, <a class="code" href="classcutlass_1_1layout_1_1ColumnMajor.html">layout::ColumnMajor</a>,</div><div class="line"><a name="l00587"></a><span class="lineno">  587</span>&#160;                      ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_</div><div class="line"><a name="l00588"></a><span class="lineno">  588</span>&#160;                     &gt; {</div><div class="line"><a name="l00589"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#adec0b67751d581deb517b0eaf74cc6f1">  589</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#adec0b67751d581deb517b0eaf74cc6f1">Shape</a> = Shape_;</div><div class="line"><a name="l00590"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#a7030d7c50418f3b7bda8b6dbf594056f">  590</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#a7030d7c50418f3b7bda8b6dbf594056f">WarpShape</a> = WarpShape_;</div><div class="line"><a name="l00591"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#a77672784e6e2f17669c018f4caea2700">  591</a></span>&#160;  <span class="keyword">using</span> <a class="code" 
href="structcutlass_1_1gemm_1_1GemmShape.html">InstructionShape</a> = <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">GemmShape&lt;1, 1, 1&gt;</a>;</div><div class="line"><a name="l00592"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#a2c9a0f9e8ed1ef32d2fe075aab67d603">  592</a></span>&#160;  <span class="keyword">using</span> ElementA = ElementA_;</div><div class="line"><a name="l00593"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#a2abba1ee7e00d2cbafa6c2cc113f4523">  593</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1layout_1_1ColumnMajor.html">LayoutA</a> = <a class="code" href="classcutlass_1_1layout_1_1ColumnMajor.html">layout::ColumnMajor</a>;</div><div class="line"><a name="l00594"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#aeea466e769f03e5c15406ab2f7614c50">  594</a></span>&#160;  <span class="keyword">using</span> ElementB = ElementB_;</div><div class="line"><a name="l00595"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#a500021e29b6263b4faf4ac8d9011c5be">  595</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1layout_1_1ColumnMajor.html">LayoutB</a> = <a class="code" href="classcutlass_1_1layout_1_1ColumnMajor.html">layout::ColumnMajor</a>;</div><div class="line"><a name="l00596"></a><span class="lineno"><a class="line" 
href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#a70b15ab8005a28399d5f516545fc7a7c">  596</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#a70b15ab8005a28399d5f516545fc7a7c">ElementC</a> = ElementC_;</div><div class="line"><a name="l00597"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#aeb7ff4ca2dd952e411f92e8628d6c015">  597</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#aeb7ff4ca2dd952e411f92e8628d6c015">LayoutC</a> = LayoutC_;</div><div class="line"><a name="l00598"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#abb9841f9f90c868e9ec2ee0b19295534">  598</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#abb9841f9f90c868e9ec2ee0b19295534">OperatorClass</a> = arch::OpClassSimt;</div><div class="line"><a name="l00599"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#aa33ac47916bd5e9458989915426c8b3b">  599</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> PartitionsK = Shape::kK / WarpShape::kK;</div><div class="line"><a 
name="l00600"></a><span class="lineno">  600</span>&#160;</div><div class="line"><a name="l00602"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#a717f638b194fbbc0692ddd94282a6724">  602</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#a717f638b194fbbc0692ddd94282a6724">Operator</a> = Operator_;</div><div class="line"><a name="l00603"></a><span class="lineno">  603</span>&#160;</div><div class="line"><a name="l00605"></a><span class="lineno">  605</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">WarpCount</a> = <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">GemmShape</a>&lt;</div><div class="line"><a name="l00606"></a><span class="lineno">  606</span>&#160;    Shape::kM / WarpShape::kM,</div><div class="line"><a name="l00607"></a><span class="lineno">  607</span>&#160;    Shape::kN / WarpShape::kN,</div><div class="line"><a name="l00608"></a><span class="lineno">  608</span>&#160;    PartitionsK</div><div class="line"><a name="l00609"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#a05eae33a361475acdf8830a798a2c3b3">  609</a></span>&#160;  &gt;;</div><div class="line"><a name="l00610"></a><span class="lineno">  610</span>&#160;</div><div class="line"><a name="l00611"></a><span class="lineno">  611</span>&#160;  <span class="comment">// Divisibility requirements</span></div><div class="line"><a name="l00612"></a><span class="lineno">  612</span>&#160;  <a class="code" href="platform_8h.html#adde4c9ea91b753491851361a4198c009">static_assert</a>(</div><div class="line"><a 
name="l00613"></a><span class="lineno">  613</span>&#160;    !(Shape::kM % WarpShape::kM) &amp;&amp;</div><div class="line"><a name="l00614"></a><span class="lineno">  614</span>&#160;    !(Shape::kN % WarpShape::kN),</div><div class="line"><a name="l00615"></a><span class="lineno">  615</span>&#160;    <span class="stringliteral">&quot;Threadblock-scoped GEMM should be divisible by warp-scoped GEMM size.&quot;</span></div><div class="line"><a name="l00616"></a><span class="lineno">  616</span>&#160;  );</div><div class="line"><a name="l00617"></a><span class="lineno">  617</span>&#160;</div><div class="line"><a name="l00619"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#a4fd0ab760457ff4a67e15a33f98d9ee8">  619</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kWarpSize = <a class="code" href="structcutlass_1_1gemm_1_1warp_1_1WarpSize.html">warp::WarpSize&lt;arch::OpClassSimt&gt;::value</a>;</div><div class="line"><a name="l00620"></a><span class="lineno">  620</span>&#160;</div><div class="line"><a name="l00622"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#ab11fdc63d433ecd0be3224709b6552a8">  622</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kThreads = WarpCount::kCount * kWarpSize;</div><div class="line"><a name="l00623"></a><span class="lineno">  623</span>&#160;</div><div class="line"><a name="l00624"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#a601876c23a6a30441744fff49e35219b">  624</a></span>&#160;  <span 
class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kElementsPerAccess = 1;</div><div class="line"><a name="l00625"></a><span class="lineno">  625</span>&#160;</div><div class="line"><a name="l00626"></a><span class="lineno">  626</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l00627"></a><span class="lineno">  627</span>&#160;  <span class="comment">// Shared memory layouts</span></div><div class="line"><a name="l00628"></a><span class="lineno">  628</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l00629"></a><span class="lineno">  629</span>&#160;</div><div class="line"><a name="l00630"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#a6b00b5e6965772079c3cd4fafe6a08d2">  630</a></span>&#160;  <span class="keyword">using</span> SmemLayoutA = <a class="code" href="classcutlass_1_1layout_1_1ColumnMajor.html">layout::ColumnMajor</a>;</div><div class="line"><a name="l00631"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#a8d2d71b3c658a7e37ce29abd7c1c5157">  631</a></span>&#160;  <span class="keyword">using</span> SmemLayoutB = <a class="code" href="classcutlass_1_1layout_1_1RowMajor.html">layout::RowMajor</a>;</div><div class="line"><a name="l00632"></a><span class="lineno">  632</span>&#160;</div><div class="line"><a name="l00633"></a><span class="lineno">  633</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l00634"></a><span class="lineno">  634</span>&#160;  <span class="comment">// Iterators to write to shared memory</span></div><div class="line"><a name="l00635"></a><span class="lineno">  635</span>&#160;  <span class="comment">//</span></div><div class="line"><a 
name="l00636"></a><span class="lineno">  636</span>&#160;</div><div class="line"><a name="l00638"></a><span class="lineno">  638</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1transform_1_1PitchLinearStripminedThreadMap.html">IteratorThreadMapA</a> = <a class="code" href="structcutlass_1_1transform_1_1PitchLinearStripminedThreadMap.html">transform::PitchLinearStripminedThreadMap</a>&lt;</div><div class="line"><a name="l00639"></a><span class="lineno">  639</span>&#160;    layout::PitchLinearShape&lt;Shape::kM, Shape::kK&gt;,</div><div class="line"><a name="l00640"></a><span class="lineno">  640</span>&#160;    kThreads,</div><div class="line"><a name="l00641"></a><span class="lineno">  641</span>&#160;    kElementsPerAccess</div><div class="line"><a name="l00642"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#a0f450843b1adf93a82d8fc2e3c58f769">  642</a></span>&#160;  &gt;;</div><div class="line"><a name="l00643"></a><span class="lineno">  643</span>&#160;</div><div class="line"><a name="l00645"></a><span class="lineno">  645</span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileIterator.html">SmemIteratorA</a> = <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileIterator.html">transform::threadblock::RegularTileIterator</a>&lt;</div><div class="line"><a name="l00646"></a><span class="lineno">  646</span>&#160;    MatrixShape&lt;Shape::kM, Shape::kK&gt;, </div><div class="line"><a name="l00647"></a><span class="lineno">  647</span>&#160;    ElementA,</div><div class="line"><a name="l00648"></a><span class="lineno">  648</span>&#160;    SmemLayoutA,</div><div class="line"><a name="l00649"></a><span class="lineno">  649</span>&#160;    1,</div><div class="line"><a name="l00650"></a><span 
class="lineno">  650</span>&#160;    <a class="code" href="structcutlass_1_1transform_1_1PitchLinearStripminedThreadMap.html">IteratorThreadMapA</a></div><div class="line"><a name="l00651"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#ab898ca6db537f16c9dd800be47cf7bff">  651</a></span>&#160;  &gt;;</div><div class="line"><a name="l00652"></a><span class="lineno">  652</span>&#160;</div><div class="line"><a name="l00654"></a><span class="lineno">  654</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1transform_1_1PitchLinearStripminedThreadMap.html">IteratorThreadMapB</a> =  <a class="code" href="structcutlass_1_1transform_1_1PitchLinearStripminedThreadMap.html">transform::PitchLinearStripminedThreadMap</a>&lt;</div><div class="line"><a name="l00655"></a><span class="lineno">  655</span>&#160;    layout::PitchLinearShape&lt;Shape::kK, Shape::kN&gt;,</div><div class="line"><a name="l00656"></a><span class="lineno">  656</span>&#160;    kThreads,</div><div class="line"><a name="l00657"></a><span class="lineno">  657</span>&#160;    kElementsPerAccess</div><div class="line"><a name="l00658"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#a89581e14b7ce8bc081a6a6a1ee9857d7">  658</a></span>&#160;  &gt;;</div><div class="line"><a name="l00659"></a><span class="lineno">  659</span>&#160;</div><div class="line"><a name="l00661"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#aac0106f814a0488fb50497f65a401892">  661</a></span>&#160;  <span class="keyword">using</span> <a class="code" 
href="structcutlass_1_1transform_1_1TransposePitchLinearThreadMapSimt.html">SmemThreadMapB</a> = <a class="code" href="structcutlass_1_1transform_1_1TransposePitchLinearThreadMapSimt.html">transform::TransposePitchLinearThreadMapSimt&lt;IteratorThreadMapB&gt;</a>;</div><div class="line"><a name="l00662"></a><span class="lineno">  662</span>&#160;</div><div class="line"><a name="l00664"></a><span class="lineno">  664</span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileIterator.html">SmemIteratorB</a> = <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileIterator.html">transform::threadblock::RegularTileIterator</a>&lt;</div><div class="line"><a name="l00665"></a><span class="lineno">  665</span>&#160;    MatrixShape&lt;Shape::kK, Shape::kN&gt;, </div><div class="line"><a name="l00666"></a><span class="lineno">  666</span>&#160;    ElementB,</div><div class="line"><a name="l00667"></a><span class="lineno">  667</span>&#160;    SmemLayoutB,</div><div class="line"><a name="l00668"></a><span class="lineno">  668</span>&#160;    0,</div><div class="line"><a name="l00669"></a><span class="lineno">  669</span>&#160;    <a class="code" href="structcutlass_1_1transform_1_1TransposePitchLinearThreadMapSimt.html">SmemThreadMapB</a></div><div class="line"><a name="l00670"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#aa0465a28382fbc55c793d4bf595a8a58">  670</a></span>&#160;  &gt;;</div><div class="line"><a name="l00671"></a><span class="lineno">  671</span>&#160;</div><div class="line"><a name="l00672"></a><span class="lineno">  672</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l00673"></a><span class="lineno">  673</span>&#160;  <span class="comment">// Warp-level matrix multiply operator</span></div><div 
class="line"><a name="l00674"></a><span class="lineno">  674</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l00675"></a><span class="lineno">  675</span>&#160;</div><div class="line"><a name="l00676"></a><span class="lineno">  676</span>&#160;  <span class="comment">// Define the warp-level op</span></div><div class="line"><a name="l00677"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#ad3bb204696969cd9305266d8b56922b5">  677</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> WarpNumThreadsM = detail::simt_get_warp_threads_m&lt;WarpShape&gt;();</div><div class="line"><a name="l00678"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#ab6179c422ea3c8673b0a62b0736d6d10">  678</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> WarpNumThreadsN = kWarpSize / WarpNumThreadsM;</div><div class="line"><a name="l00679"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#af1f8ae8f205ecc0a8f2fa4f8e91c7240">  679</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> ThreadTileM = WarpShape::kM / WarpNumThreadsM;</div><div class="line"><a name="l00680"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#aa7daa4db5819908bf594385a4084042c">  680</a></span>&#160;  <span class="keyword">static</span> <span 
class="keyword">const</span> <span class="keywordtype">int</span> ThreadTileN = WarpShape::kN / WarpNumThreadsN;</div><div class="line"><a name="l00681"></a><span class="lineno">  681</span>&#160;  <a class="code" href="platform_8h.html#adde4c9ea91b753491851361a4198c009">static_assert</a>(!(WarpShape::kM % WarpNumThreadsM) &amp;&amp; !(WarpShape::kN % WarpNumThreadsN),</div><div class="line"><a name="l00682"></a><span class="lineno">  682</span>&#160;      <span class="stringliteral">&quot;WarpShape must be divisible by ThreadTile shape.&quot;</span>);</div><div class="line"><a name="l00683"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#a1b986b60aa15efb6abf0813d555dac11">  683</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> LaneLayout = ThreadTileM &gt; 4 &amp;&amp; ThreadTileN &gt; 4 ? 
2 : 1;</div><div class="line"><a name="l00684"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#a835a6be9306595a22328cd37c0e5c5f3">  684</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> numElementsA = 128 / <a class="code" href="structcutlass_1_1sizeof__bits.html">sizeof_bits&lt;ElementA&gt;::value</a>;</div><div class="line"><a name="l00685"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#a05260a45241f6401c4166c3476e16705">  685</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> numElementsB = 128 / <a class="code" href="structcutlass_1_1sizeof__bits.html">sizeof_bits&lt;ElementB&gt;::value</a>;</div><div class="line"><a name="l00686"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#abbb050a9f8e623ef752a0d524e3f9c41">  686</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> LaneM = <a class="code" href="namespacecutlass.html#a1676e17a7fea0ac40d9d239cbd3ce872">cutlass::const_min</a>(numElementsA, ThreadTileM);</div><div class="line"><a name="l00687"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#a73a9507bca254ae2811231205144ac7b">  687</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> LaneN = <a class="code" 
href="namespacecutlass.html#a1676e17a7fea0ac40d9d239cbd3ce872">cutlass::const_min</a>(numElementsB, ThreadTileN);</div><div class="line"><a name="l00688"></a><span class="lineno">  688</span>&#160;</div><div class="line"><a name="l00689"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#a196c99c24aa9b108105d0488aaf7e058">  689</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kPaddingN = <a class="code" href="namespacecutlass_1_1gemm_1_1threadblock_1_1detail.html#a16d673aabb47b0d09f506197bf65e240">detail::simt_transpose_padding</a>(kWarpSize, Shape::kK, <a class="code" href="structcutlass_1_1sizeof__bits.html">sizeof_bits&lt;ElementB&gt;::value</a>);</div><div class="line"><a name="l00690"></a><span class="lineno">  690</span>&#160;</div><div class="line"><a name="l00691"></a><span class="lineno">  691</span>&#160;  <span class="comment">// these should have max of thread tile also</span></div><div class="line"><a name="l00692"></a><span class="lineno">  692</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">LaneMmaShape</a> = <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">cutlass::gemm::GemmShape</a>&lt;</div><div class="line"><a name="l00693"></a><span class="lineno">  693</span>&#160;      LaneM,</div><div class="line"><a name="l00694"></a><span class="lineno">  694</span>&#160;      LaneN,</div><div class="line"><a name="l00695"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#a1fa217acb8da1bc6973b882e6e3fefe5">  695</a></span>&#160;      1&gt;;</div><div class="line"><a name="l00696"></a><span class="lineno">  696</span>&#160;  <span 
class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1warp_1_1MmaSimtPolicy.html">Policy</a> = <a class="code" href="structcutlass_1_1gemm_1_1warp_1_1MmaSimtPolicy.html">cutlass::gemm::warp::MmaSimtPolicy</a>&lt;</div><div class="line"><a name="l00697"></a><span class="lineno">  697</span>&#160;      <a class="code" href="structcutlass_1_1MatrixShape.html">cutlass::MatrixShape&lt;WarpNumThreadsM, WarpNumThreadsN&gt;</a>,   <span class="comment">// WarpShape</span></div><div class="line"><a name="l00698"></a><span class="lineno">  698</span>&#160;      <a class="code" href="structcutlass_1_1layout_1_1RowMajorInterleaved.html">cutlass::layout::RowMajorInterleaved&lt;LaneLayout&gt;</a>,         <span class="comment">// LaneLayout</span></div><div class="line"><a name="l00699"></a><span class="lineno">  699</span>&#160;      <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">LaneMmaShape</a></div><div class="line"><a name="l00700"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#a5c0553c4e049d6ebcd87ba251080b77d">  700</a></span>&#160;  &gt;;</div><div class="line"><a name="l00701"></a><span class="lineno">  701</span>&#160;</div><div class="line"><a name="l00702"></a><span class="lineno">  702</span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1gemm_1_1warp_1_1MmaSimt.html">MmaWarpSimt</a> = <a class="code" href="classcutlass_1_1gemm_1_1warp_1_1MmaSimt.html">cutlass::gemm::warp::MmaSimt</a>&lt;</div><div class="line"><a name="l00703"></a><span class="lineno">  703</span>&#160;      <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#a7030d7c50418f3b7bda8b6dbf594056f">WarpShape</a>,    </div><div class="line"><a name="l00704"></a><span class="lineno">  704</span>&#160;  
    ElementA,     </div><div class="line"><a name="l00705"></a><span class="lineno">  705</span>&#160;      SmemLayoutA,  </div><div class="line"><a name="l00706"></a><span class="lineno">  706</span>&#160;      ElementB,     </div><div class="line"><a name="l00707"></a><span class="lineno">  707</span>&#160;      SmemLayoutB,  </div><div class="line"><a name="l00708"></a><span class="lineno">  708</span>&#160;      <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#a70b15ab8005a28399d5f516545fc7a7c">ElementC</a>,     </div><div class="line"><a name="l00709"></a><span class="lineno">  709</span>&#160;      <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#aeb7ff4ca2dd952e411f92e8628d6c015">LayoutC</a>,      </div><div class="line"><a name="l00710"></a><span class="lineno">  710</span>&#160;      <a class="code" href="structcutlass_1_1gemm_1_1warp_1_1MmaSimtPolicy.html">Policy</a>        </div><div class="line"><a name="l00711"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#a5da02e8f8e757c09c7e59ad2750a7833">  711</a></span>&#160;  &gt;;</div><div class="line"><a name="l00712"></a><span class="lineno">  712</span>&#160;</div><div class="line"><a name="l00714"></a><span class="lineno">  714</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#a62de2763f572e5a71e9587f49d0905e6">MmaPolicy</a> = <a class="code" 
href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#a62de2763f572e5a71e9587f49d0905e6">MmaPolicy</a>&lt;</div><div class="line"><a name="l00715"></a><span class="lineno">  715</span>&#160;    <a class="code" href="classcutlass_1_1gemm_1_1warp_1_1MmaSimt.html">MmaWarpSimt</a>,</div><div class="line"><a name="l00716"></a><span class="lineno">  716</span>&#160;    <a class="code" href="structcutlass_1_1MatrixShape.html">MatrixShape&lt;0, 0&gt;</a>,</div><div class="line"><a name="l00717"></a><span class="lineno">  717</span>&#160;    <a class="code" href="structcutlass_1_1MatrixShape.html">MatrixShape&lt;0, kPaddingN&gt;</a>, <span class="comment">// skew for B matrix to avoid SMEM bank conflicts</span></div><div class="line"><a name="l00718"></a><span class="lineno">  718</span>&#160;    WarpCount::kK</div><div class="line"><a name="l00719"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#a62de2763f572e5a71e9587f49d0905e6">  719</a></span>&#160;  &gt;;</div><div class="line"><a name="l00720"></a><span class="lineno">  720</span>&#160;};</div><div class="line"><a name="l00721"></a><span class="lineno">  721</span>&#160;</div><div class="line"><a name="l00723"></a><span class="lineno">  723</span>&#160;</div><div class="line"><a name="l00731"></a><span class="lineno">  731</span>&#160;<span class="keyword">template</span> &lt;</div><div class="line"><a name="l00734"></a><span class="lineno">  734</span>&#160;    <span class="keyword">typename</span> Shape_,</div><div class="line"><a name="l00736"></a><span class="lineno">  736</span>&#160;    <span class="keyword">typename</span> WarpShape_,</div><div class="line"><a name="l00738"></a><span class="lineno">  738</span>&#160;    <span class="keyword">typename</span> ElementC_,</div><div class="line"><a 
name="l00740"></a><span class="lineno">  740</span>&#160;    <span class="keyword">typename</span> LayoutC_,</div><div class="line"><a name="l00742"></a><span class="lineno">  742</span>&#160;    <span class="keyword">typename</span> Operator_&gt;</div><div class="line"><a name="l00743"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html">  743</a></span>&#160;<span class="keyword">struct </span><a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore.html">DefaultMmaCore</a>&lt;Shape_, WarpShape_, <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">GemmShape</a>&lt;1, 1, 4&gt;, int8_t,</div><div class="line"><a name="l00744"></a><span class="lineno">  744</span>&#160;                      layout::ColumnMajor, int8_t, <a class="code" href="classcutlass_1_1layout_1_1RowMajor.html">layout::RowMajor</a>, ElementC_,</div><div class="line"><a name="l00745"></a><span class="lineno">  745</span>&#160;                      LayoutC_, arch::OpClassSimt, 2, Operator_</div><div class="line"><a name="l00746"></a><span class="lineno">  746</span>&#160;                    &gt; {</div><div class="line"><a name="l00747"></a><span class="lineno">  747</span>&#160;</div><div class="line"><a name="l00748"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#af00303b35d278e533aaf3ae3ba82d017">  748</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#af00303b35d278e533aaf3ae3ba82d017">Shape</a> = Shape_;</div><div class="line"><a name="l00749"></a><span class="lineno"><a class="line" 
href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#a03ef3ea08d70d25e222ee0339afa1e0a">  749</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#a03ef3ea08d70d25e222ee0339afa1e0a">WarpShape</a> = WarpShape_;</div><div class="line"><a name="l00750"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#a06edf3a91f98cc7a0e8ab9c01f30b21a">  750</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">InstructionShape</a> = <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">GemmShape&lt;1, 1, 4&gt;</a>;</div><div class="line"><a name="l00751"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#a5fb3e0d7309e1689dc9319ec5b0b194d">  751</a></span>&#160;  <span class="keyword">using</span> ElementA = int8_t;</div><div class="line"><a name="l00752"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#acab21f4d5466d09c3c97a3729f27ce96">  752</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1layout_1_1ColumnMajor.html">LayoutA</a> = <a class="code" href="classcutlass_1_1layout_1_1ColumnMajor.html">layout::ColumnMajor</a>;</div><div class="line"><a name="l00753"></a><span class="lineno"><a class="line" 
href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#a3284d6d6771d39f72f26e72422c78d1c">  753</a></span>&#160;  <span class="keyword">using</span> ElementB = int8_t;</div><div class="line"><a name="l00754"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#a034033ba6eb8d4a013536bd6bba4d289">  754</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1layout_1_1RowMajor.html">LayoutB</a> = <a class="code" href="classcutlass_1_1layout_1_1RowMajor.html">layout::RowMajor</a>;</div><div class="line"><a name="l00755"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#afe290c0c2c5dc44ca2f7b73d93f9fe6f">  755</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#afe290c0c2c5dc44ca2f7b73d93f9fe6f">ElementC</a> = ElementC_;</div><div class="line"><a name="l00756"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#acdc66d5a5d190e94e0562eed3d3ddf30">  756</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#acdc66d5a5d190e94e0562eed3d3ddf30">LayoutC</a> = LayoutC_;</div><div class="line"><a name="l00757"></a><span class="lineno"><a class="line" 
href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#a63a2d785d9fa1e0373378b9801aec228">  757</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#a63a2d785d9fa1e0373378b9801aec228">OperatorClass</a> = arch::OpClassSimt;</div><div class="line"><a name="l00758"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#a521119adcd3eddf50876448c506a5e38">  758</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> PartitionsK = Shape::kK / WarpShape::kK;</div><div class="line"><a name="l00759"></a><span class="lineno">  759</span>&#160;</div><div class="line"><a name="l00761"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#af0d7f0f10f163b0191cebf5e920dfed3">  761</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#af0d7f0f10f163b0191cebf5e920dfed3">Operator</a> = Operator_;</div><div class="line"><a name="l00762"></a><span class="lineno">  762</span>&#160;</div><div class="line"><a name="l00764"></a><span class="lineno">  764</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">WarpCount</a> = <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">GemmShape</a>&lt;</div><div class="line"><a name="l00765"></a><span class="lineno">  765</span>&#160;    Shape::kM / WarpShape::kM,</div><div 
class="line"><a name="l00766"></a><span class="lineno">  766</span>&#160;    Shape::kN / WarpShape::kN,</div><div class="line"><a name="l00767"></a><span class="lineno">  767</span>&#160;    PartitionsK</div><div class="line"><a name="l00768"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#accc41a6694b5b976a23819b29ea10239">  768</a></span>&#160;  &gt;;</div><div class="line"><a name="l00769"></a><span class="lineno">  769</span>&#160;</div><div class="line"><a name="l00770"></a><span class="lineno">  770</span>&#160;  <span class="comment">// Divisibility requirements</span></div><div class="line"><a name="l00771"></a><span class="lineno">  771</span>&#160;  <a class="code" href="platform_8h.html#adde4c9ea91b753491851361a4198c009">static_assert</a>(</div><div class="line"><a name="l00772"></a><span class="lineno">  772</span>&#160;    !(Shape::kM % WarpShape::kM) &amp;&amp;</div><div class="line"><a name="l00773"></a><span class="lineno">  773</span>&#160;    !(Shape::kN % WarpShape::kN),</div><div class="line"><a name="l00774"></a><span class="lineno">  774</span>&#160;    <span class="stringliteral">&quot;Threadblock-scoped GEMM should be divisible by warp-scoped GEMM size.&quot;</span></div><div class="line"><a name="l00775"></a><span class="lineno">  775</span>&#160;  );</div><div class="line"><a name="l00776"></a><span class="lineno">  776</span>&#160;</div><div class="line"><a name="l00778"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#aabe489e7c3115f2083ec0c64d2459c08">  778</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kWarpSize = <a class="code" 
href="structcutlass_1_1gemm_1_1warp_1_1WarpSize.html">warp::WarpSize&lt;arch::OpClassSimt&gt;::value</a>;</div><div class="line"><a name="l00779"></a><span class="lineno">  779</span>&#160;</div><div class="line"><a name="l00781"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#a6b92b85ebec9e381f2fc5eaac9f61567">  781</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kThreads = WarpCount::kCount * kWarpSize;</div><div class="line"><a name="l00782"></a><span class="lineno">  782</span>&#160;</div><div class="line"><a name="l00783"></a><span class="lineno">  783</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l00784"></a><span class="lineno">  784</span>&#160;  <span class="comment">// Shared memory layouts</span></div><div class="line"><a name="l00785"></a><span class="lineno">  785</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l00786"></a><span class="lineno">  786</span>&#160;</div><div class="line"><a name="l00787"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#a673e7626a670486dfb3fa9fb10b91779">  787</a></span>&#160;  <span class="keyword">using</span> SmemLayoutA = <a class="code" href="structcutlass_1_1layout_1_1ColumnMajorInterleaved.html">layout::ColumnMajorInterleaved&lt;4&gt;</a>;</div><div class="line"><a name="l00788"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#a60921be2153e9cc79d2a9323c6450009">  788</a></span>&#160;  <span class="keyword">using</span> SmemLayoutB = <a class="code" 
href="structcutlass_1_1layout_1_1RowMajorInterleaved.html">layout::RowMajorInterleaved&lt;4&gt;</a>;</div><div class="line"><a name="l00789"></a><span class="lineno">  789</span>&#160;</div><div class="line"><a name="l00790"></a><span class="lineno">  790</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l00791"></a><span class="lineno">  791</span>&#160;  <span class="comment">// Iterators to write to shared memory</span></div><div class="line"><a name="l00792"></a><span class="lineno">  792</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l00793"></a><span class="lineno">  793</span>&#160;</div><div class="line"><a name="l00795"></a><span class="lineno">  795</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1transform_1_1PitchLinear2DThreadTileStripminedThreadMap.html">IteratorThreadMapA</a> = <a class="code" href="structcutlass_1_1transform_1_1PitchLinear2DThreadTileStripminedThreadMap.html">transform::PitchLinear2DThreadTileStripminedThreadMap</a>&lt;</div><div class="line"><a name="l00796"></a><span class="lineno">  796</span>&#160;    layout::PitchLinearShape&lt;Shape::kM, Shape::kK&gt;,</div><div class="line"><a name="l00797"></a><span class="lineno">  797</span>&#160;    kThreads,</div><div class="line"><a name="l00798"></a><span class="lineno">  798</span>&#160;    <a class="code" href="structcutlass_1_1layout_1_1PitchLinearShape.html">layout::PitchLinearShape&lt;4, 4&gt;</a></div><div class="line"><a name="l00799"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#a6034c733de72b0f3060f92102298c9d6">  799</a></span>&#160;  &gt;;</div><div class="line"><a name="l00800"></a><span class="lineno">  800</span>&#160;</div><div class="line"><a name="l00802"></a><span class="lineno">  802</span>&#160;  <span class="keyword">using</span> <a 
class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileIterator2dThreadTile.html">SmemIteratorA</a> = <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileIterator2dThreadTile.html">transform::threadblock::RegularTileIterator2dThreadTile</a>&lt;</div><div class="line"><a name="l00803"></a><span class="lineno">  803</span>&#160;    MatrixShape&lt;Shape::kM, Shape::kK&gt;, </div><div class="line"><a name="l00804"></a><span class="lineno">  804</span>&#160;    ElementA, </div><div class="line"><a name="l00805"></a><span class="lineno">  805</span>&#160;    SmemLayoutA,</div><div class="line"><a name="l00806"></a><span class="lineno">  806</span>&#160;    1,</div><div class="line"><a name="l00807"></a><span class="lineno">  807</span>&#160;    <a class="code" href="structcutlass_1_1transform_1_1PitchLinear2DThreadTileStripminedThreadMap.html">IteratorThreadMapA</a></div><div class="line"><a name="l00808"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#ac22f4fd8ca898dce6b189fc0bcb8d537">  808</a></span>&#160;  &gt;;</div><div class="line"><a name="l00809"></a><span class="lineno">  809</span>&#160;  </div><div class="line"><a name="l00810"></a><span class="lineno">  810</span>&#160;</div><div class="line"><a name="l00812"></a><span class="lineno">  812</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1transform_1_1PitchLinear2DThreadTileStripminedThreadMap.html">IteratorThreadMapB</a> = <a class="code" href="structcutlass_1_1transform_1_1PitchLinear2DThreadTileStripminedThreadMap.html">transform::PitchLinear2DThreadTileStripminedThreadMap</a>&lt;</div><div class="line"><a name="l00813"></a><span class="lineno">  813</span>&#160;    layout::PitchLinearShape&lt;Shape::kN, Shape::kK&gt;,</div><div class="line"><a name="l00814"></a><span class="lineno">  
814</span>&#160;    kThreads,</div><div class="line"><a name="l00815"></a><span class="lineno">  815</span>&#160;    <a class="code" href="structcutlass_1_1layout_1_1PitchLinearShape.html">layout::PitchLinearShape&lt;4, 4&gt;</a></div><div class="line"><a name="l00816"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#a81b77d546a00570e7941b5e08b37269c">  816</a></span>&#160;  &gt;;</div><div class="line"><a name="l00817"></a><span class="lineno">  817</span>&#160;</div><div class="line"><a name="l00819"></a><span class="lineno">  819</span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileIterator2dThreadTile.html">SmemIteratorB</a> = <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileIterator2dThreadTile.html">transform::threadblock::RegularTileIterator2dThreadTile</a>&lt;</div><div class="line"><a name="l00820"></a><span class="lineno">  820</span>&#160;    MatrixShape&lt;Shape::kK, Shape::kN&gt;, </div><div class="line"><a name="l00821"></a><span class="lineno">  821</span>&#160;    ElementB, </div><div class="line"><a name="l00822"></a><span class="lineno">  822</span>&#160;    SmemLayoutB,</div><div class="line"><a name="l00823"></a><span class="lineno">  823</span>&#160;    0,</div><div class="line"><a name="l00824"></a><span class="lineno">  824</span>&#160;    <a class="code" href="structcutlass_1_1transform_1_1PitchLinear2DThreadTileStripminedThreadMap.html">IteratorThreadMapB</a></div><div class="line"><a name="l00825"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#a14008d3c0644ca2ef7774ec166760a80">  825</a></span>&#160;  &gt;;</div><div class="line"><a name="l00826"></a><span class="lineno">  
826</span>&#160;</div><div class="line"><a name="l00827"></a><span class="lineno">  827</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l00828"></a><span class="lineno">  828</span>&#160;  <span class="comment">// Warp-level matrix multiply operator</span></div><div class="line"><a name="l00829"></a><span class="lineno">  829</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l00830"></a><span class="lineno">  830</span>&#160;</div><div class="line"><a name="l00831"></a><span class="lineno">  831</span>&#160;  <span class="comment">// Define the warp-level op</span></div><div class="line"><a name="l00832"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#a65d7c200bc30359936ad67c853335203">  832</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> WarpNumThreadsM = detail::simt_get_warp_threads_m&lt;WarpShape&gt;();</div><div class="line"><a name="l00833"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#ac3be323ac103c41ae6a41aed8176d29f">  833</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> WarpNumThreadsN = kWarpSize / WarpNumThreadsM;</div><div class="line"><a name="l00834"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#aaade2637929dc0af96ee80ea3b9f5bff">  834</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> ThreadTileM = WarpShape::kM / WarpNumThreadsM;</div><div class="line"><a 
name="l00835"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#a61528d63fb17c57cb5ed53f5607328db">  835</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> ThreadTileN = WarpShape::kN / WarpNumThreadsN;</div><div class="line"><a name="l00836"></a><span class="lineno">  836</span>&#160;  <a class="code" href="platform_8h.html#adde4c9ea91b753491851361a4198c009">static_assert</a>(!(WarpShape::kM % WarpNumThreadsM) &amp;&amp; !(WarpShape::kN % WarpNumThreadsN),</div><div class="line"><a name="l00837"></a><span class="lineno">  837</span>&#160;      <span class="stringliteral">&quot;WarpShape must be divisible by ThreadTile shape.&quot;</span>);</div><div class="line"><a name="l00838"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#a66c65842f2237de04938014b1e443547">  838</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> LaneLayout = ThreadTileM &gt; 4 &amp;&amp; ThreadTileN &gt; 4 ? 
2 : 1;</div><div class="line"><a name="l00839"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#a3c5ed5647ab4879e510bcafae4bfe6d4">  839</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> numElementsA = 128 / <a class="code" href="structcutlass_1_1sizeof__bits.html">sizeof_bits&lt;ElementA&gt;::value</a>;</div><div class="line"><a name="l00840"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#a561b22b9a9475a6e29a5e40c3ec1c588">  840</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> numElementsB = 128 / <a class="code" href="structcutlass_1_1sizeof__bits.html">sizeof_bits&lt;ElementB&gt;::value</a>;</div><div class="line"><a name="l00841"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#a1d4eae7e2ea69cc172dbde0d6819af1b">  841</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> LaneM = <a class="code" href="namespacecutlass.html#a1676e17a7fea0ac40d9d239cbd3ce872">cutlass::const_min</a>(4, ThreadTileM);</div><div class="line"><a name="l00842"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#afd4a52cec8cb61475cc856eb23189af8">  842</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> LaneN = <a class="code" 
href="namespacecutlass.html#a1676e17a7fea0ac40d9d239cbd3ce872">cutlass::const_min</a>(4, ThreadTileN);</div><div class="line"><a name="l00843"></a><span class="lineno">  843</span>&#160;  <span class="comment">// these should have max of thread tile also</span></div><div class="line"><a name="l00844"></a><span class="lineno">  844</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">LaneMmaShape</a> = <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">cutlass::gemm::GemmShape</a>&lt;</div><div class="line"><a name="l00845"></a><span class="lineno">  845</span>&#160;      LaneM,</div><div class="line"><a name="l00846"></a><span class="lineno">  846</span>&#160;      LaneN,</div><div class="line"><a name="l00847"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#a030d4d758adeae583d0d80871773fec0">  847</a></span>&#160;      4&gt;;</div><div class="line"><a name="l00848"></a><span class="lineno">  848</span>&#160;</div><div class="line"><a name="l00849"></a><span class="lineno">  849</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1warp_1_1MmaSimtPolicy.html">Policy</a> = <a class="code" href="structcutlass_1_1gemm_1_1warp_1_1MmaSimtPolicy.html">cutlass::gemm::warp::MmaSimtPolicy</a>&lt;</div><div class="line"><a name="l00850"></a><span class="lineno">  850</span>&#160;      <a class="code" href="structcutlass_1_1MatrixShape.html">cutlass::MatrixShape&lt;WarpNumThreadsM, WarpNumThreadsN&gt;</a>,   <span class="comment">// WarpShape</span></div><div class="line"><a name="l00851"></a><span class="lineno">  851</span>&#160;      <a class="code" href="structcutlass_1_1layout_1_1ColumnMajorInterleaved.html">cutlass::layout::ColumnMajorInterleaved&lt;LaneLayout&gt;</a>,         <span class="comment">// LaneLayout</span></div><div 
class="line"><a name="l00852"></a><span class="lineno">  852</span>&#160;      <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">LaneMmaShape</a></div><div class="line"><a name="l00853"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#a6d1fb04576af9af3d989c39545d810d4">  853</a></span>&#160;  &gt;;</div><div class="line"><a name="l00854"></a><span class="lineno">  854</span>&#160;</div><div class="line"><a name="l00855"></a><span class="lineno">  855</span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1gemm_1_1warp_1_1MmaSimt.html">MmaWarpSimt</a> = <a class="code" href="classcutlass_1_1gemm_1_1warp_1_1MmaSimt.html">cutlass::gemm::warp::MmaSimt</a>&lt;</div><div class="line"><a name="l00856"></a><span class="lineno">  856</span>&#160;    <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#a03ef3ea08d70d25e222ee0339afa1e0a">WarpShape</a>,    </div><div class="line"><a name="l00857"></a><span class="lineno">  857</span>&#160;    ElementA,     </div><div class="line"><a name="l00858"></a><span class="lineno">  858</span>&#160;    SmemLayoutA,  </div><div class="line"><a name="l00859"></a><span class="lineno">  859</span>&#160;    ElementB,     </div><div class="line"><a name="l00860"></a><span class="lineno">  860</span>&#160;    SmemLayoutB,  </div><div class="line"><a name="l00861"></a><span class="lineno">  861</span>&#160;    <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#afe290c0c2c5dc44ca2f7b73d93f9fe6f">ElementC</a>,     </div><div class="line"><a name="l00862"></a><span class="lineno">  862</span>&#160;    <a class="code" 
href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#acdc66d5a5d190e94e0562eed3d3ddf30">LayoutC</a>,      </div><div class="line"><a name="l00863"></a><span class="lineno">  863</span>&#160;    <a class="code" href="structcutlass_1_1gemm_1_1warp_1_1MmaSimtPolicy.html">Policy</a>,       </div><div class="line"><a name="l00864"></a><span class="lineno">  864</span>&#160;    PartitionsK   </div><div class="line"><a name="l00865"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#ad2299d968635843d88000386bd2ca20d">  865</a></span>&#160;    &gt;;</div><div class="line"><a name="l00866"></a><span class="lineno">  866</span>&#160;</div><div class="line"><a name="l00868"></a><span class="lineno">  868</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#aada86baebc846e6614f3616688477fba">MmaPolicy</a> = <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#aada86baebc846e6614f3616688477fba">MmaPolicy</a>&lt;</div><div class="line"><a name="l00869"></a><span class="lineno">  869</span>&#160;    <a class="code" href="classcutlass_1_1gemm_1_1warp_1_1MmaSimt.html">MmaWarpSimt</a>,</div><div class="line"><a name="l00870"></a><span class="lineno">  870</span>&#160;    <a class="code" href="structcutlass_1_1MatrixShape.html">MatrixShape&lt;0, 0&gt;</a>,</div><div class="line"><a name="l00871"></a><span class="lineno">  871</span>&#160;    MatrixShape&lt;0, 0&gt;,</div><div class="line"><a name="l00872"></a><span class="lineno">  872</span>&#160;    WarpCount::kK</div><div class="line"><a name="l00873"></a><span 
class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#aada86baebc846e6614f3616688477fba">  873</a></span>&#160;  &gt;;</div><div class="line"><a name="l00874"></a><span class="lineno">  874</span>&#160;};</div><div class="line"><a name="l00875"></a><span class="lineno">  875</span>&#160;</div><div class="line"><a name="l00878"></a><span class="lineno">  878</span>&#160;<span class="comment">//</span></div><div class="line"><a name="l00885"></a><span class="lineno">  885</span>&#160;<span class="comment"></span><span class="keyword">template</span> &lt;</div><div class="line"><a name="l00888"></a><span class="lineno">  888</span>&#160;    <span class="keyword">typename</span> Shape_,</div><div class="line"><a name="l00890"></a><span class="lineno">  890</span>&#160;    <span class="keyword">typename</span> WarpShape_,</div><div class="line"><a name="l00892"></a><span class="lineno">  892</span>&#160;    <span class="keyword">typename</span> ElementC_,</div><div class="line"><a name="l00894"></a><span class="lineno">  894</span>&#160;    <span class="keyword">typename</span> LayoutC_,</div><div class="line"><a name="l00896"></a><span class="lineno">  896</span>&#160;    <span class="keyword">typename</span> Operator_&gt;</div><div class="line"><a name="l00897"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html">  897</a></span>&#160;<span class="keyword">struct </span><a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore.html">DefaultMmaCore</a>&lt;Shape_, WarpShape_, <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">GemmShape</a>&lt;1, 1, 4&gt;, int8_t,</div><div class="line"><a name="l00898"></a><span class="lineno">  898</span>&#160;                      layout::RowMajor, int8_t, <a 
class="code" href="classcutlass_1_1layout_1_1ColumnMajor.html">layout::ColumnMajor</a>, ElementC_,</div><div class="line"><a name="l00899"></a><span class="lineno">  899</span>&#160;                      LayoutC_, arch::OpClassSimt, 2, Operator_</div><div class="line"><a name="l00900"></a><span class="lineno">  900</span>&#160;                      &gt; {</div><div class="line"><a name="l00901"></a><span class="lineno">  901</span>&#160;</div><div class="line"><a name="l00902"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#a3bd2c938edb75c58d6b0d9f5f9970239">  902</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#a3bd2c938edb75c58d6b0d9f5f9970239">Shape</a> = Shape_;</div><div class="line"><a name="l00903"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#a9e0ab047c9957fc0e3ce232e98c91a7e">  903</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#a9e0ab047c9957fc0e3ce232e98c91a7e">WarpShape</a> = WarpShape_;</div><div class="line"><a name="l00904"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#a57c8d3edfc3202db15382b5f19835e3c">  904</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">InstructionShape</a> = <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">GemmShape&lt;1, 1, 
4&gt;</a>;</div><div class="line"><a name="l00905"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#af3694b5c3cfbe1cb15564498b6834dfb">  905</a></span>&#160;  <span class="keyword">using</span> ElementA = int8_t;</div><div class="line"><a name="l00906"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#a2f121d87f28c3f69a37813fce5e193be">  906</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1layout_1_1RowMajor.html">LayoutA</a> = <a class="code" href="classcutlass_1_1layout_1_1RowMajor.html">layout::RowMajor</a>;</div><div class="line"><a name="l00907"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#a9cd48403279034ae9267b4ff3019bfbe">  907</a></span>&#160;  <span class="keyword">using</span> ElementB = int8_t;</div><div class="line"><a name="l00908"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#a44f471eebd05eb3c24fb6de9bbb56a95">  908</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1layout_1_1ColumnMajor.html">LayoutB</a> = <a class="code" href="classcutlass_1_1layout_1_1ColumnMajor.html">layout::ColumnMajor</a>;</div><div class="line"><a name="l00909"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#ade835163d1fac35dce14031c37bebb96">  909</a></span>&#160;  <span class="keyword">using</span> <a class="code" 
href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#ade835163d1fac35dce14031c37bebb96">ElementC</a> = ElementC_;</div><div class="line"><a name="l00910"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#ae3de45321d07b5b45e17b1ba7ff136ce">  910</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#ae3de45321d07b5b45e17b1ba7ff136ce">LayoutC</a> = LayoutC_;</div><div class="line"><a name="l00911"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#ac694a206c028c5e55610f6477da8ed94">  911</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#ac694a206c028c5e55610f6477da8ed94">OperatorClass</a> = arch::OpClassSimt;</div><div class="line"><a name="l00912"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#ae22e247d96d9d8e2e49ae69fce1002c3">  912</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> PartitionsK = Shape::kK / WarpShape::kK;</div><div class="line"><a name="l00913"></a><span class="lineno">  913</span>&#160;</div><div class="line"><a name="l00915"></a><span class="lineno"><a class="line" 
href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#ab9073ff38dd4579f65b461f887d8e9f6">  915</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#ab9073ff38dd4579f65b461f887d8e9f6">Operator</a> = Operator_;</div><div class="line"><a name="l00916"></a><span class="lineno">  916</span>&#160;</div><div class="line"><a name="l00918"></a><span class="lineno">  918</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">WarpCount</a> = <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">GemmShape</a>&lt;</div><div class="line"><a name="l00919"></a><span class="lineno">  919</span>&#160;    Shape::kM / WarpShape::kM,</div><div class="line"><a name="l00920"></a><span class="lineno">  920</span>&#160;    Shape::kN / WarpShape::kN,</div><div class="line"><a name="l00921"></a><span class="lineno">  921</span>&#160;    PartitionsK</div><div class="line"><a name="l00922"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#a49c58c46efaea921d86607f56cba7066">  922</a></span>&#160;  &gt;;</div><div class="line"><a name="l00923"></a><span class="lineno">  923</span>&#160;</div><div class="line"><a name="l00924"></a><span class="lineno">  924</span>&#160;  <span class="comment">// Divisibility requirements</span></div><div class="line"><a name="l00925"></a><span class="lineno">  925</span>&#160;  <a class="code" href="platform_8h.html#adde4c9ea91b753491851361a4198c009">static_assert</a>(</div><div class="line"><a name="l00926"></a><span class="lineno">  926</span>&#160;    !(Shape::kM % WarpShape::kM) &amp;&amp;</div><div class="line"><a 
name="l00927"></a><span class="lineno">  927</span>&#160;    !(Shape::kN % WarpShape::kN),</div><div class="line"><a name="l00928"></a><span class="lineno">  928</span>&#160;    <span class="stringliteral">&quot;Threadblock-scoped GEMM should be divisible by warp-scoped GEMM size.&quot;</span></div><div class="line"><a name="l00929"></a><span class="lineno">  929</span>&#160;  );</div><div class="line"><a name="l00930"></a><span class="lineno">  930</span>&#160;</div><div class="line"><a name="l00932"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#ae290ffe7237c2aac3b87528927df4289">  932</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kWarpSize = <a class="code" href="structcutlass_1_1gemm_1_1warp_1_1WarpSize.html">warp::WarpSize&lt;arch::OpClassSimt&gt;::value</a>;</div><div class="line"><a name="l00933"></a><span class="lineno">  933</span>&#160;</div><div class="line"><a name="l00935"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#a75d55d083ad9c4a59222366b802bfc41">  935</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kThreads = WarpCount::kCount * kWarpSize;</div><div class="line"><a name="l00936"></a><span class="lineno">  936</span>&#160;</div><div class="line"><a name="l00937"></a><span class="lineno">  937</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l00938"></a><span class="lineno">  938</span>&#160;  <span class="comment">// Shared memory layouts</span></div><div class="line"><a name="l00939"></a><span class="lineno">  939</span>&#160;  <span class="comment">//</span></div><div class="line"><a 
name="l00940"></a><span class="lineno">  940</span>&#160;</div><div class="line"><a name="l00941"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#ae2b9215d830e83f89619bb1eb94052d6">  941</a></span>&#160;  <span class="keyword">using</span> SmemLayoutA = <a class="code" href="structcutlass_1_1layout_1_1ColumnMajorInterleaved.html">layout::ColumnMajorInterleaved&lt;4&gt;</a>;</div><div class="line"><a name="l00942"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#a414b095cacbeae1375800ce8e190495e">  942</a></span>&#160;  <span class="keyword">using</span> SmemLayoutB = <a class="code" href="structcutlass_1_1layout_1_1RowMajorInterleaved.html">layout::RowMajorInterleaved&lt;4&gt;</a>;</div><div class="line"><a name="l00943"></a><span class="lineno">  943</span>&#160;</div><div class="line"><a name="l00944"></a><span class="lineno">  944</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l00945"></a><span class="lineno">  945</span>&#160;  <span class="comment">// Iterators to write to shared memory</span></div><div class="line"><a name="l00946"></a><span class="lineno">  946</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l00947"></a><span class="lineno">  947</span>&#160;</div><div class="line"><a name="l00949"></a><span class="lineno">  949</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1transform_1_1PitchLinear2DThreadTileStripminedThreadMap.html">IteratorThreadMapA</a> = <a class="code" href="structcutlass_1_1transform_1_1PitchLinear2DThreadTileStripminedThreadMap.html">transform::PitchLinear2DThreadTileStripminedThreadMap</a>&lt;</div><div class="line"><a name="l00950"></a><span class="lineno">  
950</span>&#160;    layout::PitchLinearShape&lt;Shape::kK, Shape::kM&gt;,</div><div class="line"><a name="l00951"></a><span class="lineno">  951</span>&#160;    kThreads,</div><div class="line"><a name="l00952"></a><span class="lineno">  952</span>&#160;    <a class="code" href="structcutlass_1_1layout_1_1PitchLinearShape.html">layout::PitchLinearShape&lt;4, 4&gt;</a></div><div class="line"><a name="l00953"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#a11b7dc567a5f7bb381827b8409530f6a">  953</a></span>&#160;  &gt;;</div><div class="line"><a name="l00954"></a><span class="lineno">  954</span>&#160;</div><div class="line"><a name="l00956"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#aaf46eaa6a7a79376d0aad79c43af8684">  956</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1transform_1_1TransposePitchLinearThreadMap2DThreadTile.html">SmemThreadMapA</a> = <a class="code" href="structcutlass_1_1transform_1_1TransposePitchLinearThreadMap2DThreadTile.html">transform::TransposePitchLinearThreadMap2DThreadTile&lt;IteratorThreadMapA&gt;</a>;</div><div class="line"><a name="l00957"></a><span class="lineno">  957</span>&#160;</div><div class="line"><a name="l00959"></a><span class="lineno">  959</span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileIterator2dThreadTile.html">SmemIteratorA</a> = <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileIterator2dThreadTile.html">transform::threadblock::RegularTileIterator2dThreadTile</a>&lt;</div><div class="line"><a name="l00960"></a><span class="lineno">  960</span>&#160;    MatrixShape&lt;Shape::kM, Shape::kK&gt;, </div><div 
class="line"><a name="l00961"></a><span class="lineno">  961</span>&#160;    ElementA, </div><div class="line"><a name="l00962"></a><span class="lineno">  962</span>&#160;    SmemLayoutA,</div><div class="line"><a name="l00963"></a><span class="lineno">  963</span>&#160;    1,</div><div class="line"><a name="l00964"></a><span class="lineno">  964</span>&#160;    <a class="code" href="structcutlass_1_1transform_1_1TransposePitchLinearThreadMap2DThreadTile.html">SmemThreadMapA</a></div><div class="line"><a name="l00965"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#a7633f7038f950d77730873b3a47441ab">  965</a></span>&#160;  &gt;;</div><div class="line"><a name="l00966"></a><span class="lineno">  966</span>&#160;  </div><div class="line"><a name="l00967"></a><span class="lineno">  967</span>&#160;</div><div class="line"><a name="l00969"></a><span class="lineno">  969</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1transform_1_1PitchLinear2DThreadTileStripminedThreadMap.html">IteratorThreadMapB</a> = <a class="code" href="structcutlass_1_1transform_1_1PitchLinear2DThreadTileStripminedThreadMap.html">transform::PitchLinear2DThreadTileStripminedThreadMap</a>&lt;</div><div class="line"><a name="l00970"></a><span class="lineno">  970</span>&#160;    layout::PitchLinearShape&lt;Shape::kK, Shape::kN&gt;,</div><div class="line"><a name="l00971"></a><span class="lineno">  971</span>&#160;    kThreads,</div><div class="line"><a name="l00972"></a><span class="lineno">  972</span>&#160;    <a class="code" href="structcutlass_1_1layout_1_1PitchLinearShape.html">layout::PitchLinearShape&lt;4, 4&gt;</a></div><div class="line"><a name="l00973"></a><span class="lineno"><a class="line" 
href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#aede8b6f434f8bc14a337820d7c79abf2">  973</a></span>&#160;  &gt;;</div><div class="line"><a name="l00974"></a><span class="lineno">  974</span>&#160;</div><div class="line"><a name="l00976"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#ae8f2b98ab2b00f8addb6f85e8ff3de27">  976</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1transform_1_1TransposePitchLinearThreadMap2DThreadTile.html">SmemThreadMapB</a> = <a class="code" href="structcutlass_1_1transform_1_1TransposePitchLinearThreadMap2DThreadTile.html">transform::TransposePitchLinearThreadMap2DThreadTile&lt;IteratorThreadMapB&gt;</a>;</div><div class="line"><a name="l00977"></a><span class="lineno">  977</span>&#160;</div><div class="line"><a name="l00979"></a><span class="lineno">  979</span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileIterator2dThreadTile.html">SmemIteratorB</a> = <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileIterator2dThreadTile.html">transform::threadblock::RegularTileIterator2dThreadTile</a>&lt;</div><div class="line"><a name="l00980"></a><span class="lineno">  980</span>&#160;    MatrixShape&lt;Shape::kK, Shape::kN&gt;, </div><div class="line"><a name="l00981"></a><span class="lineno">  981</span>&#160;    ElementB, </div><div class="line"><a name="l00982"></a><span class="lineno">  982</span>&#160;    SmemLayoutB,</div><div class="line"><a name="l00983"></a><span class="lineno">  983</span>&#160;    0,</div><div class="line"><a name="l00984"></a><span class="lineno">  984</span>&#160;    <a class="code" 
href="structcutlass_1_1transform_1_1TransposePitchLinearThreadMap2DThreadTile.html">SmemThreadMapB</a></div><div class="line"><a name="l00985"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#a518bd61d9a82b9a6d0acf18e4fd9284f">  985</a></span>&#160;  &gt;;</div><div class="line"><a name="l00986"></a><span class="lineno">  986</span>&#160;</div><div class="line"><a name="l00987"></a><span class="lineno">  987</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l00988"></a><span class="lineno">  988</span>&#160;  <span class="comment">// Warp-level matrix multiply operator</span></div><div class="line"><a name="l00989"></a><span class="lineno">  989</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l00990"></a><span class="lineno">  990</span>&#160;</div><div class="line"><a name="l00991"></a><span class="lineno">  991</span>&#160;  <span class="comment">// Define the warp-level op</span></div><div class="line"><a name="l00992"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#a5eeec4441d70152df9d7f30d769e86a8">  992</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> WarpNumThreadsM = detail::simt_get_warp_threads_m&lt;WarpShape&gt;();</div><div class="line"><a name="l00993"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#a29e6f52efc96b9be70233a34dc2e9de3">  993</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> WarpNumThreadsN = kWarpSize / WarpNumThreadsM;</div><div 
class="line"><a name="l00994"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#a4dc03b1fd234520991b093ae64bbb65f">  994</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> ThreadTileM = WarpShape::kM / WarpNumThreadsM;</div><div class="line"><a name="l00995"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#a1e32a066033992f71fa1e1fa77a6222a">  995</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> ThreadTileN = WarpShape::kN / WarpNumThreadsN;</div><div class="line"><a name="l00996"></a><span class="lineno">  996</span>&#160;  <a class="code" href="platform_8h.html#adde4c9ea91b753491851361a4198c009">static_assert</a>(!(WarpShape::kM % WarpNumThreadsM) &amp;&amp; !(WarpShape::kN % WarpNumThreadsN),</div><div class="line"><a name="l00997"></a><span class="lineno">  997</span>&#160;      <span class="stringliteral">&quot;WarpShape must be divisible by ThreadTile shape.&quot;</span>);</div><div class="line"><a name="l00998"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#a7cb67e3594ca449c7d2aa96a53af4a1b">  998</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> LaneLayout = ThreadTileM &gt; 4 &amp;&amp; ThreadTileN &gt; 4 ? 
2 : 1;</div><div class="line"><a name="l00999"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#acb471a82804720e617b55648e61a93e4">  999</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> numElementsA = 128 / <a class="code" href="structcutlass_1_1sizeof__bits.html">sizeof_bits&lt;ElementA&gt;::value</a>;</div><div class="line"><a name="l01000"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#a41680f60612611b17181a36a4ee9905b"> 1000</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> numElementsB = 128 / <a class="code" href="structcutlass_1_1sizeof__bits.html">sizeof_bits&lt;ElementB&gt;::value</a>;</div><div class="line"><a name="l01001"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#aad83ca7a224399e3475bb40d2d33ce99"> 1001</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> LaneM = <a class="code" href="namespacecutlass.html#a1676e17a7fea0ac40d9d239cbd3ce872">cutlass::const_min</a>(4, ThreadTileM);</div><div class="line"><a name="l01002"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#a8b867e482c60af0034b5f824af18cf4b"> 1002</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> LaneN = <a class="code" 
href="namespacecutlass.html#a1676e17a7fea0ac40d9d239cbd3ce872">cutlass::const_min</a>(4, ThreadTileN);</div><div class="line"><a name="l01003"></a><span class="lineno"> 1003</span>&#160;  <span class="comment">// these should have max of thread tile also</span></div><div class="line"><a name="l01004"></a><span class="lineno"> 1004</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">LaneMmaShape</a> = <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">cutlass::gemm::GemmShape</a>&lt;</div><div class="line"><a name="l01005"></a><span class="lineno"> 1005</span>&#160;      LaneM,</div><div class="line"><a name="l01006"></a><span class="lineno"> 1006</span>&#160;      LaneN,</div><div class="line"><a name="l01007"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#ae491f8ca4cf60e4ec48e14c364ba5346"> 1007</a></span>&#160;      4&gt;;</div><div class="line"><a name="l01008"></a><span class="lineno"> 1008</span>&#160;</div><div class="line"><a name="l01009"></a><span class="lineno"> 1009</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1warp_1_1MmaSimtPolicy.html">Policy</a> = <a class="code" href="structcutlass_1_1gemm_1_1warp_1_1MmaSimtPolicy.html">cutlass::gemm::warp::MmaSimtPolicy</a>&lt;</div><div class="line"><a name="l01010"></a><span class="lineno"> 1010</span>&#160;      <a class="code" href="structcutlass_1_1MatrixShape.html">cutlass::MatrixShape&lt;WarpNumThreadsM, WarpNumThreadsN&gt;</a>,   <span class="comment">// WarpShape</span></div><div class="line"><a name="l01011"></a><span class="lineno"> 1011</span>&#160;      <a class="code" href="structcutlass_1_1layout_1_1ColumnMajorInterleaved.html">cutlass::layout::ColumnMajorInterleaved&lt;LaneLayout&gt;</a>,         <span class="comment">// LaneLayout</span></div><div 
class="line"><a name="l01012"></a><span class="lineno"> 1012</span>&#160;      <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">LaneMmaShape</a></div><div class="line"><a name="l01013"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#a5b4fe0717b80227cb8af9e705a058c05"> 1013</a></span>&#160;  &gt;;</div><div class="line"><a name="l01014"></a><span class="lineno"> 1014</span>&#160;</div><div class="line"><a name="l01015"></a><span class="lineno"> 1015</span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1gemm_1_1warp_1_1MmaSimt.html">MmaWarpSimt</a> = <a class="code" href="classcutlass_1_1gemm_1_1warp_1_1MmaSimt.html">cutlass::gemm::warp::MmaSimt</a>&lt;</div><div class="line"><a name="l01016"></a><span class="lineno"> 1016</span>&#160;    <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#a9e0ab047c9957fc0e3ce232e98c91a7e">WarpShape</a>,    </div><div class="line"><a name="l01017"></a><span class="lineno"> 1017</span>&#160;    ElementA,     </div><div class="line"><a name="l01018"></a><span class="lineno"> 1018</span>&#160;    SmemLayoutA,  </div><div class="line"><a name="l01019"></a><span class="lineno"> 1019</span>&#160;    ElementB,     </div><div class="line"><a name="l01020"></a><span class="lineno"> 1020</span>&#160;    SmemLayoutB,  </div><div class="line"><a name="l01021"></a><span class="lineno"> 1021</span>&#160;    <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#ade835163d1fac35dce14031c37bebb96">ElementC</a>,     </div><div class="line"><a name="l01022"></a><span class="lineno"> 1022</span>&#160;    <a class="code" 
href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#ae3de45321d07b5b45e17b1ba7ff136ce">LayoutC</a>,      </div><div class="line"><a name="l01023"></a><span class="lineno"> 1023</span>&#160;    <a class="code" href="structcutlass_1_1gemm_1_1warp_1_1MmaSimtPolicy.html">Policy</a>,       </div><div class="line"><a name="l01024"></a><span class="lineno"> 1024</span>&#160;    PartitionsK   </div><div class="line"><a name="l01025"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#acba9ead4e2ec4c4b99d7d22f492acf74"> 1025</a></span>&#160;    &gt;;</div><div class="line"><a name="l01026"></a><span class="lineno"> 1026</span>&#160;</div><div class="line"><a name="l01027"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#aad05aa4bf8d369467d71a40dbddd9f30"> 1027</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kPaddingM = <a class="code" href="namespacecutlass_1_1gemm_1_1threadblock_1_1detail.html#a16d673aabb47b0d09f506197bf65e240">detail::simt_transpose_padding</a>(kWarpSize, Shape::kK, <a class="code" href="structcutlass_1_1sizeof__bits.html">sizeof_bits&lt;ElementA&gt;::value</a>);</div><div class="line"><a name="l01028"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#a03e627a13f5a22475df6dbdd6c68d151"> 1028</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kPaddingN = <a class="code" 
href="namespacecutlass_1_1gemm_1_1threadblock_1_1detail.html#a16d673aabb47b0d09f506197bf65e240">detail::simt_transpose_padding</a>(kWarpSize, Shape::kK, <a class="code" href="structcutlass_1_1sizeof__bits.html">sizeof_bits&lt;ElementB&gt;::value</a>);</div><div class="line"><a name="l01029"></a><span class="lineno"> 1029</span>&#160;</div><div class="line"><a name="l01031"></a><span class="lineno"> 1031</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#ad8f801b18df3a58f83aa5e8ce325fcf6">MmaPolicy</a> = <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#ad8f801b18df3a58f83aa5e8ce325fcf6">MmaPolicy</a>&lt;</div><div class="line"><a name="l01032"></a><span class="lineno"> 1032</span>&#160;    <a class="code" href="classcutlass_1_1gemm_1_1warp_1_1MmaSimt.html">MmaWarpSimt</a>,</div><div class="line"><a name="l01033"></a><span class="lineno"> 1033</span>&#160;    <a class="code" href="structcutlass_1_1MatrixShape.html">MatrixShape&lt;kPaddingM, 0&gt;</a>,</div><div class="line"><a name="l01034"></a><span class="lineno"> 1034</span>&#160;    <a class="code" href="structcutlass_1_1MatrixShape.html">MatrixShape&lt;0, kPaddingN&gt;</a>,</div><div class="line"><a name="l01035"></a><span class="lineno"> 1035</span>&#160;    WarpCount::kK</div><div class="line"><a name="l01036"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#ad8f801b18df3a58f83aa5e8ce325fcf6"> 1036</a></span>&#160;  &gt;;</div><div class="line"><a name="l01037"></a><span class="lineno"> 1037</span>&#160;};</div><div class="line"><a name="l01038"></a><span class="lineno"> 1038</span>&#160;</div><div class="line"><a 
name="l01041"></a><span class="lineno"> 1041</span>&#160;<span class="comment">//</span></div><div class="line"><a name="l01048"></a><span class="lineno"> 1048</span>&#160;<span class="comment"></span><span class="keyword">template</span> &lt;</div><div class="line"><a name="l01051"></a><span class="lineno"> 1051</span>&#160;    <span class="keyword">typename</span> Shape_,</div><div class="line"><a name="l01053"></a><span class="lineno"> 1053</span>&#160;    <span class="keyword">typename</span> WarpShape_,</div><div class="line"><a name="l01055"></a><span class="lineno"> 1055</span>&#160;    <span class="keyword">typename</span> ElementC_,</div><div class="line"><a name="l01057"></a><span class="lineno"> 1057</span>&#160;    <span class="keyword">typename</span> LayoutC_,</div><div class="line"><a name="l01059"></a><span class="lineno"> 1059</span>&#160;    <span class="keyword">typename</span> Operator_&gt;</div><div class="line"><a name="l01060"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html"> 1060</a></span>&#160;<span class="keyword">struct </span><a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore.html">DefaultMmaCore</a>&lt;Shape_, WarpShape_, <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">GemmShape</a>&lt;1, 1, 4&gt;, int8_t,</div><div class="line"><a name="l01061"></a><span class="lineno"> 1061</span>&#160;                      layout::RowMajor, int8_t, <a class="code" href="classcutlass_1_1layout_1_1RowMajor.html">layout::RowMajor</a>, ElementC_,</div><div class="line"><a name="l01062"></a><span class="lineno"> 1062</span>&#160;                      LayoutC_, arch::OpClassSimt, 2, Operator_</div><div class="line"><a name="l01063"></a><span class="lineno"> 1063</span>&#160;                      &gt; {</div><div class="line"><a name="l01064"></a><span class="lineno"> 
1064</span>&#160;</div><div class="line"><a name="l01065"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#ac013076a3c9380a79407ad708ac09eb3"> 1065</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#ac013076a3c9380a79407ad708ac09eb3">Shape</a> = Shape_;</div><div class="line"><a name="l01066"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#aa62154dc21ce92b46887cefe5fcf3054"> 1066</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#aa62154dc21ce92b46887cefe5fcf3054">WarpShape</a> = WarpShape_;</div><div class="line"><a name="l01067"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#aa3c6e36d439c7ac96d1fb5ae28f7394e"> 1067</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">InstructionShape</a> = <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">GemmShape&lt;1, 1, 4&gt;</a>;</div><div class="line"><a name="l01068"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#adda37c22ddc18461524cc0d97c4245f9"> 1068</a></span>&#160;  <span class="keyword">using</span> ElementA = int8_t;</div><div class="line"><a name="l01069"></a><span class="lineno"><a class="line" 
href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#af884e14f4e9bfb37f6273d7360729524"> 1069</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1layout_1_1RowMajor.html">LayoutA</a> = <a class="code" href="classcutlass_1_1layout_1_1RowMajor.html">layout::RowMajor</a>;</div><div class="line"><a name="l01070"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#a89597f580f16eaef469595c6ac183104"> 1070</a></span>&#160;  <span class="keyword">using</span> ElementB = int8_t;</div><div class="line"><a name="l01071"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#a9dc63d44b2cf0b8f6c7e93f3234e65e9"> 1071</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1layout_1_1RowMajor.html">LayoutB</a> = <a class="code" href="classcutlass_1_1layout_1_1RowMajor.html">layout::RowMajor</a>;</div><div class="line"><a name="l01072"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#ad3fce3b8a477190dc5d335b549b12c85"> 1072</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#ad3fce3b8a477190dc5d335b549b12c85">ElementC</a> = ElementC_;</div><div class="line"><a name="l01073"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#af7b416c742dacf93ab522a40699c6c71"> 
1073</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#af7b416c742dacf93ab522a40699c6c71">LayoutC</a> = LayoutC_;</div><div class="line"><a name="l01074"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#af274c0fe139375dd34d0ea3dfbaf9703"> 1074</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#af274c0fe139375dd34d0ea3dfbaf9703">OperatorClass</a> = arch::OpClassSimt;</div><div class="line"><a name="l01075"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#ab81183f42ddd0474c45bd4ecfd2f91cb"> 1075</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> PartitionsK = Shape::kK / WarpShape::kK;</div><div class="line"><a name="l01076"></a><span class="lineno"> 1076</span>&#160;</div><div class="line"><a name="l01078"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#a373439df9ac285ab153ac52d1953e8d4"> 1078</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#a373439df9ac285ab153ac52d1953e8d4">Operator</a> = Operator_;</div><div class="line"><a name="l01079"></a><span class="lineno"> 1079</span>&#160;</div><div class="line"><a name="l01081"></a><span 
class="lineno"> 1081</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">WarpCount</a> = <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">GemmShape</a>&lt;</div><div class="line"><a name="l01082"></a><span class="lineno"> 1082</span>&#160;    Shape::kM / WarpShape::kM,</div><div class="line"><a name="l01083"></a><span class="lineno"> 1083</span>&#160;    Shape::kN / WarpShape::kN,</div><div class="line"><a name="l01084"></a><span class="lineno"> 1084</span>&#160;    PartitionsK</div><div class="line"><a name="l01085"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#a7db68b43c401c881e622ece588dd3e13"> 1085</a></span>&#160;  &gt;;</div><div class="line"><a name="l01086"></a><span class="lineno"> 1086</span>&#160;</div><div class="line"><a name="l01087"></a><span class="lineno"> 1087</span>&#160;  <span class="comment">// Divisibility requirements</span></div><div class="line"><a name="l01088"></a><span class="lineno"> 1088</span>&#160;  <a class="code" href="platform_8h.html#adde4c9ea91b753491851361a4198c009">static_assert</a>(</div><div class="line"><a name="l01089"></a><span class="lineno"> 1089</span>&#160;    !(Shape::kM % WarpShape::kM) &amp;&amp;</div><div class="line"><a name="l01090"></a><span class="lineno"> 1090</span>&#160;    !(Shape::kN % WarpShape::kN),</div><div class="line"><a name="l01091"></a><span class="lineno"> 1091</span>&#160;    <span class="stringliteral">&quot;Threadblock-scoped GEMM should be divisible by warp-scoped GEMM size.&quot;</span></div><div class="line"><a name="l01092"></a><span class="lineno"> 1092</span>&#160;  );</div><div class="line"><a name="l01093"></a><span class="lineno"> 1093</span>&#160;</div><div class="line"><a name="l01095"></a><span class="lineno"><a class="line" 
href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#a40bc7311a7bce3a1720a12c8442335c5"> 1095</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kWarpSize = <a class="code" href="structcutlass_1_1gemm_1_1warp_1_1WarpSize.html">warp::WarpSize&lt;arch::OpClassSimt&gt;::value</a>;</div><div class="line"><a name="l01096"></a><span class="lineno"> 1096</span>&#160;</div><div class="line"><a name="l01098"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#ac8eeafe5d1ca4cd04ab498e34a93a650"> 1098</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kThreads = WarpCount::kCount * kWarpSize;</div><div class="line"><a name="l01099"></a><span class="lineno"> 1099</span>&#160;</div><div class="line"><a name="l01100"></a><span class="lineno"> 1100</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l01101"></a><span class="lineno"> 1101</span>&#160;  <span class="comment">// Shared memory layouts</span></div><div class="line"><a name="l01102"></a><span class="lineno"> 1102</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l01103"></a><span class="lineno"> 1103</span>&#160;</div><div class="line"><a name="l01104"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#a3dece287e07abfe783bb7290b1fe4e45"> 1104</a></span>&#160;  <span class="keyword">using</span> SmemLayoutA = <a class="code" href="structcutlass_1_1layout_1_1ColumnMajorInterleaved.html">layout::ColumnMajorInterleaved&lt;4&gt;</a>;</div><div class="line"><a name="l01105"></a><span 
class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#a4ff05ff60f5c5faaf31ffa5129408922"> 1105</a></span>&#160;  <span class="keyword">using</span> SmemLayoutB = <a class="code" href="structcutlass_1_1layout_1_1RowMajorInterleaved.html">layout::RowMajorInterleaved&lt;4&gt;</a>;</div><div class="line"><a name="l01106"></a><span class="lineno"> 1106</span>&#160;</div><div class="line"><a name="l01107"></a><span class="lineno"> 1107</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l01108"></a><span class="lineno"> 1108</span>&#160;  <span class="comment">// Iterators to write to shared memory</span></div><div class="line"><a name="l01109"></a><span class="lineno"> 1109</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l01110"></a><span class="lineno"> 1110</span>&#160;</div><div class="line"><a name="l01112"></a><span class="lineno"> 1112</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1transform_1_1PitchLinear2DThreadTileStripminedThreadMap.html">IteratorThreadMapA</a> = <a class="code" href="structcutlass_1_1transform_1_1PitchLinear2DThreadTileStripminedThreadMap.html">transform::PitchLinear2DThreadTileStripminedThreadMap</a>&lt;</div><div class="line"><a name="l01113"></a><span class="lineno"> 1113</span>&#160;    layout::PitchLinearShape&lt;Shape::kK, Shape::kM&gt;,</div><div class="line"><a name="l01114"></a><span class="lineno"> 1114</span>&#160;    kThreads,</div><div class="line"><a name="l01115"></a><span class="lineno"> 1115</span>&#160;    <a class="code" href="structcutlass_1_1layout_1_1PitchLinearShape.html">layout::PitchLinearShape&lt;4, 4&gt;</a></div><div class="line"><a name="l01116"></a><span class="lineno"><a class="line" 
href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#ab265cae212878b47d8eb4050e5e63474"> 1116</a></span>&#160;  &gt;;</div><div class="line"><a name="l01117"></a><span class="lineno"> 1117</span>&#160;</div><div class="line"><a name="l01119"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#a974e7c189bb1844e3d1c9ff286630191"> 1119</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1transform_1_1TransposePitchLinearThreadMap2DThreadTile.html">SmemThreadMapA</a> = <a class="code" href="structcutlass_1_1transform_1_1TransposePitchLinearThreadMap2DThreadTile.html">transform::TransposePitchLinearThreadMap2DThreadTile&lt;IteratorThreadMapA&gt;</a>;</div><div class="line"><a name="l01120"></a><span class="lineno"> 1120</span>&#160;</div><div class="line"><a name="l01122"></a><span class="lineno"> 1122</span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileIterator2dThreadTile.html">SmemIteratorA</a> = <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileIterator2dThreadTile.html">transform::threadblock::RegularTileIterator2dThreadTile</a>&lt;</div><div class="line"><a name="l01123"></a><span class="lineno"> 1123</span>&#160;    MatrixShape&lt;Shape::kM, Shape::kK&gt;, </div><div class="line"><a name="l01124"></a><span class="lineno"> 1124</span>&#160;    ElementA, </div><div class="line"><a name="l01125"></a><span class="lineno"> 1125</span>&#160;    SmemLayoutA,</div><div class="line"><a name="l01126"></a><span class="lineno"> 1126</span>&#160;    1,</div><div class="line"><a name="l01127"></a><span class="lineno"> 1127</span>&#160;    <a class="code" 
href="structcutlass_1_1transform_1_1TransposePitchLinearThreadMap2DThreadTile.html">SmemThreadMapA</a></div><div class="line"><a name="l01128"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#ae8f07bf158733bcdf4ed213a7b4d152f"> 1128</a></span>&#160;  &gt;;</div><div class="line"><a name="l01129"></a><span class="lineno"> 1129</span>&#160;  </div><div class="line"><a name="l01131"></a><span class="lineno"> 1131</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1transform_1_1PitchLinear2DThreadTileStripminedThreadMap.html">IteratorThreadMapB</a> = <a class="code" href="structcutlass_1_1transform_1_1PitchLinear2DThreadTileStripminedThreadMap.html">transform::PitchLinear2DThreadTileStripminedThreadMap</a>&lt;</div><div class="line"><a name="l01132"></a><span class="lineno"> 1132</span>&#160;    layout::PitchLinearShape&lt;Shape::kN, Shape::kK&gt;,</div><div class="line"><a name="l01133"></a><span class="lineno"> 1133</span>&#160;    kThreads,</div><div class="line"><a name="l01134"></a><span class="lineno"> 1134</span>&#160;    <a class="code" href="structcutlass_1_1layout_1_1PitchLinearShape.html">layout::PitchLinearShape&lt;4, 4&gt;</a></div><div class="line"><a name="l01135"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#abd3a92eaa779a0148b42921ef1e6b82c"> 1135</a></span>&#160;  &gt;;</div><div class="line"><a name="l01136"></a><span class="lineno"> 1136</span>&#160;</div><div class="line"><a name="l01138"></a><span class="lineno"> 1138</span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileIterator2dThreadTile.html">SmemIteratorB</a> = <a class="code" 
href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileIterator2dThreadTile.html">transform::threadblock::RegularTileIterator2dThreadTile</a>&lt;</div><div class="line"><a name="l01139"></a><span class="lineno"> 1139</span>&#160;    MatrixShape&lt;Shape::kK, Shape::kN&gt;, </div><div class="line"><a name="l01140"></a><span class="lineno"> 1140</span>&#160;    ElementB, </div><div class="line"><a name="l01141"></a><span class="lineno"> 1141</span>&#160;    SmemLayoutB,</div><div class="line"><a name="l01142"></a><span class="lineno"> 1142</span>&#160;    0,</div><div class="line"><a name="l01143"></a><span class="lineno"> 1143</span>&#160;    <a class="code" href="structcutlass_1_1transform_1_1PitchLinear2DThreadTileStripminedThreadMap.html">IteratorThreadMapB</a></div><div class="line"><a name="l01144"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#ac7ff41e4f0c100d5d8bfdef2331ac88d"> 1144</a></span>&#160;  &gt;;</div><div class="line"><a name="l01145"></a><span class="lineno"> 1145</span>&#160;</div><div class="line"><a name="l01146"></a><span class="lineno"> 1146</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l01147"></a><span class="lineno"> 1147</span>&#160;  <span class="comment">// Warp-level matrix multiply operator</span></div><div class="line"><a name="l01148"></a><span class="lineno"> 1148</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l01149"></a><span class="lineno"> 1149</span>&#160;</div><div class="line"><a name="l01150"></a><span class="lineno"> 1150</span>&#160;  <span class="comment">// Define the warp-level op</span></div><div class="line"><a name="l01151"></a><span class="lineno"><a class="line" 
href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#afc60a4840a2d67688ab8323face7fbf7"> 1151</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> WarpNumThreadsM = detail::simt_get_warp_threads_m&lt;WarpShape&gt;();</div><div class="line"><a name="l01152"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#aee330d2671f6b945d31925e3ee034ea1"> 1152</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> WarpNumThreadsN = kWarpSize / WarpNumThreadsM;</div><div class="line"><a name="l01153"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#a5454319e4e1764e23ad29742f5bd65d8"> 1153</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> ThreadTileM = WarpShape::kM / WarpNumThreadsM;</div><div class="line"><a name="l01154"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#ae543e3db5d0e941ad9b6c32adf4c83a7"> 1154</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> ThreadTileN = WarpShape::kN / WarpNumThreadsN;</div><div class="line"><a name="l01155"></a><span class="lineno"> 1155</span>&#160;  <a class="code" href="platform_8h.html#adde4c9ea91b753491851361a4198c009">static_assert</a>(!(WarpShape::kM % WarpNumThreadsM) &amp;&amp; !(WarpShape::kN % WarpNumThreadsN),</div><div class="line"><a name="l01156"></a><span 
class="lineno"> 1156</span>&#160;      <span class="stringliteral">&quot;WarpShape must be divisible by ThreadTile shape.&quot;</span>);</div><div class="line"><a name="l01157"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#a496cf8aeb1401f238ec18fb268b7a04d"> 1157</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> LaneLayout = ThreadTileM &gt; 4 &amp;&amp; ThreadTileN &gt; 4 ? 2 : 1;</div><div class="line"><a name="l01158"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#a5902b3af8309ead3697e609a03ed48f9"> 1158</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> numElementsA = 128 / <a class="code" href="structcutlass_1_1sizeof__bits.html">sizeof_bits&lt;ElementA&gt;::value</a>;</div><div class="line"><a name="l01159"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#afa68116da82624b365fbf784b01ec091"> 1159</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> numElementsB = 128 / <a class="code" href="structcutlass_1_1sizeof__bits.html">sizeof_bits&lt;ElementB&gt;::value</a>;</div><div class="line"><a name="l01160"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#a2891eb4dfe107d5e206d82c9b409f538"> 1160</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> 
LaneM = <a class="code" href="namespacecutlass.html#a1676e17a7fea0ac40d9d239cbd3ce872">cutlass::const_min</a>(4, ThreadTileM);</div><div class="line"><a name="l01161"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#aa33a2aa437c69706a61863c182e7d033"> 1161</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> LaneN = <a class="code" href="namespacecutlass.html#a1676e17a7fea0ac40d9d239cbd3ce872">cutlass::const_min</a>(4, ThreadTileN);</div><div class="line"><a name="l01162"></a><span class="lineno"> 1162</span>&#160;  <span class="comment">// these should have max of thread tile also</span></div><div class="line"><a name="l01163"></a><span class="lineno"> 1163</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">LaneMmaShape</a> = <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">cutlass::gemm::GemmShape</a>&lt;</div><div class="line"><a name="l01164"></a><span class="lineno"> 1164</span>&#160;      LaneM,</div><div class="line"><a name="l01165"></a><span class="lineno"> 1165</span>&#160;      LaneN,</div><div class="line"><a name="l01166"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#a29c891204ddc7ff86d296dfab985a731"> 1166</a></span>&#160;      4&gt;;</div><div class="line"><a name="l01167"></a><span class="lineno"> 1167</span>&#160;</div><div class="line"><a name="l01168"></a><span class="lineno"> 1168</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1warp_1_1MmaSimtPolicy.html">Policy</a> = <a class="code" 
href="structcutlass_1_1gemm_1_1warp_1_1MmaSimtPolicy.html">cutlass::gemm::warp::MmaSimtPolicy</a>&lt;</div><div class="line"><a name="l01169"></a><span class="lineno"> 1169</span>&#160;      <a class="code" href="structcutlass_1_1MatrixShape.html">cutlass::MatrixShape&lt;WarpNumThreadsM, WarpNumThreadsN&gt;</a>,   <span class="comment">// WarpShape</span></div><div class="line"><a name="l01170"></a><span class="lineno"> 1170</span>&#160;      <a class="code" href="structcutlass_1_1layout_1_1ColumnMajorInterleaved.html">cutlass::layout::ColumnMajorInterleaved&lt;LaneLayout&gt;</a>,         <span class="comment">// LaneLayout</span></div><div class="line"><a name="l01171"></a><span class="lineno"> 1171</span>&#160;      <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">LaneMmaShape</a></div><div class="line"><a name="l01172"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#a76f447f264ee662e71140dab01124398"> 1172</a></span>&#160;  &gt;;</div><div class="line"><a name="l01173"></a><span class="lineno"> 1173</span>&#160;</div><div class="line"><a name="l01174"></a><span class="lineno"> 1174</span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1gemm_1_1warp_1_1MmaSimt.html">MmaWarpSimt</a> = <a class="code" href="classcutlass_1_1gemm_1_1warp_1_1MmaSimt.html">cutlass::gemm::warp::MmaSimt</a>&lt;</div><div class="line"><a name="l01175"></a><span class="lineno"> 1175</span>&#160;    <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#aa62154dc21ce92b46887cefe5fcf3054">WarpShape</a>,    </div><div class="line"><a name="l01176"></a><span class="lineno"> 1176</span>&#160;    ElementA,     </div><div class="line"><a name="l01177"></a><span class="lineno"> 1177</span>&#160;    SmemLayoutA,  </div><div 
class="line"><a name="l01178"></a><span class="lineno"> 1178</span>&#160;    ElementB,     </div><div class="line"><a name="l01179"></a><span class="lineno"> 1179</span>&#160;    SmemLayoutB,  </div><div class="line"><a name="l01180"></a><span class="lineno"> 1180</span>&#160;    <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#ad3fce3b8a477190dc5d335b549b12c85">ElementC</a>,     </div><div class="line"><a name="l01181"></a><span class="lineno"> 1181</span>&#160;    <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#af7b416c742dacf93ab522a40699c6c71">LayoutC</a>,      </div><div class="line"><a name="l01182"></a><span class="lineno"> 1182</span>&#160;    <a class="code" href="structcutlass_1_1gemm_1_1warp_1_1MmaSimtPolicy.html">Policy</a>,       </div><div class="line"><a name="l01183"></a><span class="lineno"> 1183</span>&#160;    PartitionsK   </div><div class="line"><a name="l01184"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#a4c28590242538f752a18f7fc9d7959da"> 1184</a></span>&#160;    &gt;;</div><div class="line"><a name="l01185"></a><span class="lineno"> 1185</span>&#160;</div><div class="line"><a name="l01186"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#ae227984ba1993b8b2def4156128907ea"> 1186</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kPaddingM = <a class="code" 
href="namespacecutlass_1_1gemm_1_1threadblock_1_1detail.html#a16d673aabb47b0d09f506197bf65e240">detail::simt_transpose_padding</a>(kWarpSize, Shape::kK, <a class="code" href="structcutlass_1_1sizeof__bits.html">sizeof_bits&lt;ElementA&gt;::value</a>);</div><div class="line"><a name="l01187"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#aa737480b656ac28df15de8ae82a631fa"> 1187</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kPaddingN = <a class="code" href="namespacecutlass_1_1gemm_1_1threadblock_1_1detail.html#a16d673aabb47b0d09f506197bf65e240">detail::simt_transpose_padding</a>(kWarpSize, Shape::kK, <a class="code" href="structcutlass_1_1sizeof__bits.html">sizeof_bits&lt;ElementB&gt;::value</a>);</div><div class="line"><a name="l01188"></a><span class="lineno"> 1188</span>&#160;</div><div class="line"><a name="l01190"></a><span class="lineno"> 1190</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#aabe20df5c98890c82bdd20c351fb9709">MmaPolicy</a> = <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#aabe20df5c98890c82bdd20c351fb9709">MmaPolicy</a>&lt;</div><div class="line"><a name="l01191"></a><span class="lineno"> 1191</span>&#160;    <a class="code" href="classcutlass_1_1gemm_1_1warp_1_1MmaSimt.html">MmaWarpSimt</a>,</div><div class="line"><a name="l01192"></a><span class="lineno"> 1192</span>&#160;    <a class="code" href="structcutlass_1_1MatrixShape.html">MatrixShape&lt;kPaddingM, 0&gt;</a>,</div><div class="line"><a name="l01193"></a><span class="lineno"> 1193</span>&#160;    <a class="code" 
href="structcutlass_1_1MatrixShape.html">MatrixShape&lt;0, 0&gt;</a>,</div><div class="line"><a name="l01194"></a><span class="lineno"> 1194</span>&#160;    WarpCount::kK</div><div class="line"><a name="l01195"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#aabe20df5c98890c82bdd20c351fb9709"> 1195</a></span>&#160;  &gt;;</div><div class="line"><a name="l01196"></a><span class="lineno"> 1196</span>&#160;};</div><div class="line"><a name="l01197"></a><span class="lineno"> 1197</span>&#160;</div><div class="line"><a name="l01200"></a><span class="lineno"> 1200</span>&#160;<span class="comment">//</span></div><div class="line"><a name="l01207"></a><span class="lineno"> 1207</span>&#160;<span class="comment"></span><span class="keyword">template</span> &lt;</div><div class="line"><a name="l01210"></a><span class="lineno"> 1210</span>&#160;    <span class="keyword">typename</span> Shape_,</div><div class="line"><a name="l01212"></a><span class="lineno"> 1212</span>&#160;    <span class="keyword">typename</span> WarpShape_,</div><div class="line"><a name="l01214"></a><span class="lineno"> 1214</span>&#160;    <span class="keyword">typename</span> ElementC_,</div><div class="line"><a name="l01216"></a><span class="lineno"> 1216</span>&#160;    <span class="keyword">typename</span> LayoutC_,</div><div class="line"><a name="l01218"></a><span class="lineno"> 1218</span>&#160;    <span class="keyword">typename</span> Operator_&gt;</div><div class="line"><a name="l01219"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html"> 1219</a></span>&#160;<span class="keyword">struct </span><a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore.html">DefaultMmaCore</a>&lt;Shape_, WarpShape_, <a class="code" 
href="structcutlass_1_1gemm_1_1GemmShape.html">GemmShape</a>&lt;1, 1, 4&gt;, int8_t,</div><div class="line"><a name="l01220"></a><span class="lineno"> 1220</span>&#160;                      layout::ColumnMajor, int8_t, <a class="code" href="classcutlass_1_1layout_1_1ColumnMajor.html">layout::ColumnMajor</a>, ElementC_,</div><div class="line"><a name="l01221"></a><span class="lineno"> 1221</span>&#160;                      LayoutC_, arch::OpClassSimt, 2, Operator_</div><div class="line"><a name="l01222"></a><span class="lineno"> 1222</span>&#160;                      &gt; {</div><div class="line"><a name="l01223"></a><span class="lineno"> 1223</span>&#160;</div><div class="line"><a name="l01224"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#a03d48dfe750df22f2d071cf070583cbb"> 1224</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#a03d48dfe750df22f2d071cf070583cbb">Shape</a> = Shape_;</div><div class="line"><a name="l01225"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#a98ba20cab0956012d15431f330c4c859"> 1225</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#a98ba20cab0956012d15431f330c4c859">WarpShape</a> = WarpShape_;</div><div class="line"><a name="l01226"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#a2884fa009363296f7404872e354925ad"> 
1226</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">InstructionShape</a> = <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">GemmShape&lt;1, 1, 4&gt;</a>;</div><div class="line"><a name="l01227"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#a3a75e1314b7965cbed6d4d78d0d681ef"> 1227</a></span>&#160;  <span class="keyword">using</span> ElementA = int8_t;</div><div class="line"><a name="l01228"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#af221f78897173f9b8c641b3423ff9568"> 1228</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1layout_1_1ColumnMajor.html">LayoutA</a> = <a class="code" href="classcutlass_1_1layout_1_1ColumnMajor.html">layout::ColumnMajor</a>;</div><div class="line"><a name="l01229"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#ada3c2e042a4acfc4bce6f0b7de7bbeaf"> 1229</a></span>&#160;  <span class="keyword">using</span> ElementB = int8_t;</div><div class="line"><a name="l01230"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#ad74d9da21f4555f6181837e64a7450dc"> 1230</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1layout_1_1ColumnMajor.html">LayoutB</a> = <a class="code" href="classcutlass_1_1layout_1_1ColumnMajor.html">layout::ColumnMajor</a>;</div><div class="line"><a name="l01231"></a><span class="lineno"><a class="line" 
href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#a200b038225aabe5eedd7931814d27a44"> 1231</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#a200b038225aabe5eedd7931814d27a44">ElementC</a> = ElementC_;</div><div class="line"><a name="l01232"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#acc5cd244b86a03c2b8dd57b01545fbe8"> 1232</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#acc5cd244b86a03c2b8dd57b01545fbe8">LayoutC</a> = LayoutC_;</div><div class="line"><a name="l01233"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#ac2bc54c65c50ee88b7ac877c2c8469a9"> 1233</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#ac2bc54c65c50ee88b7ac877c2c8469a9">OperatorClass</a> = arch::OpClassSimt;</div><div class="line"><a name="l01234"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#a31f2cf101f49b119db8e04da688144c1"> 1234</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> PartitionsK = Shape::kK / WarpShape::kK;</div><div class="line"><a 
name="l01235"></a><span class="lineno"> 1235</span>&#160;</div><div class="line"><a name="l01237"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#a0d137c48ec0b4323a153c3a960322687"> 1237</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#a0d137c48ec0b4323a153c3a960322687">Operator</a> = Operator_;</div><div class="line"><a name="l01238"></a><span class="lineno"> 1238</span>&#160;</div><div class="line"><a name="l01240"></a><span class="lineno"> 1240</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">WarpCount</a> = <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">GemmShape</a>&lt;</div><div class="line"><a name="l01241"></a><span class="lineno"> 1241</span>&#160;    Shape::kM / WarpShape::kM,</div><div class="line"><a name="l01242"></a><span class="lineno"> 1242</span>&#160;    Shape::kN / WarpShape::kN,</div><div class="line"><a name="l01243"></a><span class="lineno"> 1243</span>&#160;    PartitionsK</div><div class="line"><a name="l01244"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#a1c7409f763449fb1f82ccbe55de4b663"> 1244</a></span>&#160;  &gt;;</div><div class="line"><a name="l01245"></a><span class="lineno"> 1245</span>&#160;</div><div class="line"><a name="l01246"></a><span class="lineno"> 1246</span>&#160;  <span class="comment">// Divisibility requirements</span></div><div class="line"><a name="l01247"></a><span class="lineno"> 1247</span>&#160;  <a class="code" href="platform_8h.html#adde4c9ea91b753491851361a4198c009">static_assert</a>(</div><div class="line"><a 
name="l01248"></a><span class="lineno"> 1248</span>&#160;    !(Shape::kM % WarpShape::kM) &amp;&amp;</div><div class="line"><a name="l01249"></a><span class="lineno"> 1249</span>&#160;    !(Shape::kN % WarpShape::kN),</div><div class="line"><a name="l01250"></a><span class="lineno"> 1250</span>&#160;    <span class="stringliteral">&quot;Threadblock-scoped GEMM should be divisible by warp-scoped GEMM size.&quot;</span></div><div class="line"><a name="l01251"></a><span class="lineno"> 1251</span>&#160;  );</div><div class="line"><a name="l01252"></a><span class="lineno"> 1252</span>&#160;</div><div class="line"><a name="l01254"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#acfa25506e0870c822e4c5c452b7091f1"> 1254</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kWarpSize = <a class="code" href="structcutlass_1_1gemm_1_1warp_1_1WarpSize.html">warp::WarpSize&lt;arch::OpClassSimt&gt;::value</a>;</div><div class="line"><a name="l01255"></a><span class="lineno"> 1255</span>&#160;</div><div class="line"><a name="l01257"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#a39e0c6bd96f947e0db63fae49ba267bf"> 1257</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kThreads = WarpCount::kCount * kWarpSize;</div><div class="line"><a name="l01258"></a><span class="lineno"> 1258</span>&#160;</div><div class="line"><a name="l01259"></a><span class="lineno"> 1259</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l01260"></a><span class="lineno"> 1260</span>&#160;  <span class="comment">// Shared memory layouts</span></div><div class="line"><a 
name="l01261"></a><span class="lineno"> 1261</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l01262"></a><span class="lineno"> 1262</span>&#160;</div><div class="line"><a name="l01263"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#afcad699188815cf0da13651c5d53fa53"> 1263</a></span>&#160;  <span class="keyword">using</span> SmemLayoutA = <a class="code" href="structcutlass_1_1layout_1_1ColumnMajorInterleaved.html">layout::ColumnMajorInterleaved&lt;4&gt;</a>;</div><div class="line"><a name="l01264"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#a86618fb8ff54b76f5499f0b3531b95cf"> 1264</a></span>&#160;  <span class="keyword">using</span> SmemLayoutB = <a class="code" href="structcutlass_1_1layout_1_1RowMajorInterleaved.html">layout::RowMajorInterleaved&lt;4&gt;</a>;</div><div class="line"><a name="l01265"></a><span class="lineno"> 1265</span>&#160;</div><div class="line"><a name="l01266"></a><span class="lineno"> 1266</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l01267"></a><span class="lineno"> 1267</span>&#160;  <span class="comment">// Iterators to write to shared memory</span></div><div class="line"><a name="l01268"></a><span class="lineno"> 1268</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l01269"></a><span class="lineno"> 1269</span>&#160;</div><div class="line"><a name="l01271"></a><span class="lineno"> 1271</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1transform_1_1PitchLinear2DThreadTileStripminedThreadMap.html">IteratorThreadMapA</a> = <a class="code" 
href="structcutlass_1_1transform_1_1PitchLinear2DThreadTileStripminedThreadMap.html">transform::PitchLinear2DThreadTileStripminedThreadMap</a>&lt;</div><div class="line"><a name="l01272"></a><span class="lineno"> 1272</span>&#160;    layout::PitchLinearShape&lt;Shape::kM, Shape::kK&gt;,</div><div class="line"><a name="l01273"></a><span class="lineno"> 1273</span>&#160;    kThreads,</div><div class="line"><a name="l01274"></a><span class="lineno"> 1274</span>&#160;    <a class="code" href="structcutlass_1_1layout_1_1PitchLinearShape.html">layout::PitchLinearShape&lt;4, 4&gt;</a></div><div class="line"><a name="l01275"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#a368fe0ace8f4cfcfd886af813344a225"> 1275</a></span>&#160;  &gt;;</div><div class="line"><a name="l01276"></a><span class="lineno"> 1276</span>&#160;</div><div class="line"><a name="l01278"></a><span class="lineno"> 1278</span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileIterator2dThreadTile.html">SmemIteratorA</a> = <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileIterator2dThreadTile.html">transform::threadblock::RegularTileIterator2dThreadTile</a>&lt;</div><div class="line"><a name="l01279"></a><span class="lineno"> 1279</span>&#160;    MatrixShape&lt;Shape::kM, Shape::kK&gt;, </div><div class="line"><a name="l01280"></a><span class="lineno"> 1280</span>&#160;    ElementA, </div><div class="line"><a name="l01281"></a><span class="lineno"> 1281</span>&#160;    SmemLayoutA,</div><div class="line"><a name="l01282"></a><span class="lineno"> 1282</span>&#160;    1,</div><div class="line"><a name="l01283"></a><span class="lineno"> 1283</span>&#160;    <a class="code" 
href="structcutlass_1_1transform_1_1PitchLinear2DThreadTileStripminedThreadMap.html">IteratorThreadMapA</a></div><div class="line"><a name="l01284"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#ad7fc5a854a66bb8f5bb59820f5d52dea"> 1284</a></span>&#160;  &gt;;</div><div class="line"><a name="l01285"></a><span class="lineno"> 1285</span>&#160;  </div><div class="line"><a name="l01286"></a><span class="lineno"> 1286</span>&#160;</div><div class="line"><a name="l01288"></a><span class="lineno"> 1288</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1transform_1_1PitchLinear2DThreadTileStripminedThreadMap.html">IteratorThreadMapB</a> = <a class="code" href="structcutlass_1_1transform_1_1PitchLinear2DThreadTileStripminedThreadMap.html">transform::PitchLinear2DThreadTileStripminedThreadMap</a>&lt;</div><div class="line"><a name="l01289"></a><span class="lineno"> 1289</span>&#160;    layout::PitchLinearShape&lt;Shape::kK, Shape::kN&gt;,</div><div class="line"><a name="l01290"></a><span class="lineno"> 1290</span>&#160;    kThreads,</div><div class="line"><a name="l01291"></a><span class="lineno"> 1291</span>&#160;    <a class="code" href="structcutlass_1_1layout_1_1PitchLinearShape.html">layout::PitchLinearShape&lt;4, 4&gt;</a></div><div class="line"><a name="l01292"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#a50e3846c0e25e25e81bdbfbacd44106c"> 1292</a></span>&#160;  &gt;;</div><div class="line"><a name="l01293"></a><span class="lineno"> 1293</span>&#160;</div><div class="line"><a name="l01295"></a><span class="lineno"><a class="line" 
href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#a38e6f8e2651575a3c6f8f6f7a43e9722"> 1295</a></span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1transform_1_1TransposePitchLinearThreadMap2DThreadTile.html">SmemThreadMapB</a> = <a class="code" href="structcutlass_1_1transform_1_1TransposePitchLinearThreadMap2DThreadTile.html">transform::TransposePitchLinearThreadMap2DThreadTile&lt;IteratorThreadMapB&gt;</a>;</div><div class="line"><a name="l01296"></a><span class="lineno"> 1296</span>&#160;</div><div class="line"><a name="l01298"></a><span class="lineno"> 1298</span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileIterator2dThreadTile.html">SmemIteratorB</a> = <a class="code" href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileIterator2dThreadTile.html">transform::threadblock::RegularTileIterator2dThreadTile</a>&lt;</div><div class="line"><a name="l01299"></a><span class="lineno"> 1299</span>&#160;    MatrixShape&lt;Shape::kK, Shape::kN&gt;, </div><div class="line"><a name="l01300"></a><span class="lineno"> 1300</span>&#160;    ElementB, </div><div class="line"><a name="l01301"></a><span class="lineno"> 1301</span>&#160;    SmemLayoutB,</div><div class="line"><a name="l01302"></a><span class="lineno"> 1302</span>&#160;    0,</div><div class="line"><a name="l01303"></a><span class="lineno"> 1303</span>&#160;    <a class="code" href="structcutlass_1_1transform_1_1TransposePitchLinearThreadMap2DThreadTile.html">SmemThreadMapB</a></div><div class="line"><a name="l01304"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#a03744ff93e49baba4b58019bd775c451"> 1304</a></span>&#160;  &gt;;</div><div class="line"><a name="l01305"></a><span 
class="lineno"> 1305</span>&#160;</div><div class="line"><a name="l01306"></a><span class="lineno"> 1306</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l01307"></a><span class="lineno"> 1307</span>&#160;  <span class="comment">// Warp-level matrix multiply operator</span></div><div class="line"><a name="l01308"></a><span class="lineno"> 1308</span>&#160;  <span class="comment">//</span></div><div class="line"><a name="l01309"></a><span class="lineno"> 1309</span>&#160;</div><div class="line"><a name="l01310"></a><span class="lineno"> 1310</span>&#160;  <span class="comment">// Define the warp-level op</span></div><div class="line"><a name="l01311"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#a66b5772dc62d37fbf3a7e36a6efc9fb5"> 1311</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> WarpNumThreadsM = detail::simt_get_warp_threads_m&lt;WarpShape&gt;();</div><div class="line"><a name="l01312"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#a365fdf65e1519f787bdf582b7cf5461c"> 1312</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> WarpNumThreadsN = kWarpSize / WarpNumThreadsM;</div><div class="line"><a name="l01313"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#a9d692b8e79fbd197ae4f6be078924e1d"> 1313</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> ThreadTileM = WarpShape::kM / WarpNumThreadsM;</div><div 
class="line"><a name="l01314"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#aee51bbe7714fd9a58b6c1d0306039328"> 1314</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> ThreadTileN = WarpShape::kN / WarpNumThreadsN;</div><div class="line"><a name="l01315"></a><span class="lineno"> 1315</span>&#160;  <a class="code" href="platform_8h.html#adde4c9ea91b753491851361a4198c009">static_assert</a>(!(WarpShape::kM % WarpNumThreadsM) &amp;&amp; !(WarpShape::kN % WarpNumThreadsN),</div><div class="line"><a name="l01316"></a><span class="lineno"> 1316</span>&#160;      <span class="stringliteral">&quot;WarpShape must be divisible by ThreadTile shape.&quot;</span>);</div><div class="line"><a name="l01317"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#af50d71b203779b393dc572c379bc06e8"> 1317</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> LaneLayout = ThreadTileM &gt; 4 &amp;&amp; ThreadTileN &gt; 4 ? 
2 : 1;</div><div class="line"><a name="l01318"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#add6ec30b9a987a0e314f9d2b90a55a89"> 1318</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> numElementsA = 128 / <a class="code" href="structcutlass_1_1sizeof__bits.html">sizeof_bits&lt;ElementA&gt;::value</a>;</div><div class="line"><a name="l01319"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#a6dfe65fe9621fcb4c1f1dd7e74e963a5"> 1319</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> numElementsB = 128 / <a class="code" href="structcutlass_1_1sizeof__bits.html">sizeof_bits&lt;ElementB&gt;::value</a>;</div><div class="line"><a name="l01320"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#a02a9cf5168ad4317406a71eb9934dd43"> 1320</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> LaneM = <a class="code" href="namespacecutlass.html#a1676e17a7fea0ac40d9d239cbd3ce872">cutlass::const_min</a>(4, ThreadTileM);</div><div class="line"><a name="l01321"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#a6b6a46649ec06c088f45806d8410de41"> 1321</a></span>&#160;  <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">int</span> LaneN = <a class="code" 
href="namespacecutlass.html#a1676e17a7fea0ac40d9d239cbd3ce872">cutlass::const_min</a>(4, ThreadTileN);</div><div class="line"><a name="l01322"></a><span class="lineno"> 1322</span>&#160;  <span class="comment">// these should have max of thread tile also</span></div><div class="line"><a name="l01323"></a><span class="lineno"> 1323</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">LaneMmaShape</a> = <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">cutlass::gemm::GemmShape</a>&lt;</div><div class="line"><a name="l01324"></a><span class="lineno"> 1324</span>&#160;      LaneM,</div><div class="line"><a name="l01325"></a><span class="lineno"> 1325</span>&#160;      LaneN,</div><div class="line"><a name="l01326"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#a154a5c15eeed1313f05522a9e4474791"> 1326</a></span>&#160;      4&gt;;</div><div class="line"><a name="l01327"></a><span class="lineno"> 1327</span>&#160;</div><div class="line"><a name="l01328"></a><span class="lineno"> 1328</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1warp_1_1MmaSimtPolicy.html">Policy</a> = <a class="code" href="structcutlass_1_1gemm_1_1warp_1_1MmaSimtPolicy.html">cutlass::gemm::warp::MmaSimtPolicy</a>&lt;</div><div class="line"><a name="l01329"></a><span class="lineno"> 1329</span>&#160;      <a class="code" href="structcutlass_1_1MatrixShape.html">cutlass::MatrixShape&lt;WarpNumThreadsM, WarpNumThreadsN&gt;</a>,   <span class="comment">// WarpShape</span></div><div class="line"><a name="l01330"></a><span class="lineno"> 1330</span>&#160;      <a class="code" href="structcutlass_1_1layout_1_1ColumnMajorInterleaved.html">cutlass::layout::ColumnMajorInterleaved&lt;LaneLayout&gt;</a>,         <span class="comment">// LaneLayout</span></div><div 
class="line"><a name="l01331"></a><span class="lineno"> 1331</span>&#160;      <a class="code" href="structcutlass_1_1gemm_1_1GemmShape.html">LaneMmaShape</a></div><div class="line"><a name="l01332"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#a346489e42e33dc95e7568793d43c5c64"> 1332</a></span>&#160;  &gt;;</div><div class="line"><a name="l01333"></a><span class="lineno"> 1333</span>&#160;</div><div class="line"><a name="l01334"></a><span class="lineno"> 1334</span>&#160;  <span class="keyword">using</span> <a class="code" href="classcutlass_1_1gemm_1_1warp_1_1MmaSimt.html">MmaWarpSimt</a> = <a class="code" href="classcutlass_1_1gemm_1_1warp_1_1MmaSimt.html">cutlass::gemm::warp::MmaSimt</a>&lt;</div><div class="line"><a name="l01335"></a><span class="lineno"> 1335</span>&#160;    <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#a98ba20cab0956012d15431f330c4c859">WarpShape</a>,    </div><div class="line"><a name="l01336"></a><span class="lineno"> 1336</span>&#160;    ElementA,     </div><div class="line"><a name="l01337"></a><span class="lineno"> 1337</span>&#160;    SmemLayoutA,  </div><div class="line"><a name="l01338"></a><span class="lineno"> 1338</span>&#160;    ElementB,     </div><div class="line"><a name="l01339"></a><span class="lineno"> 1339</span>&#160;    SmemLayoutB,  </div><div class="line"><a name="l01340"></a><span class="lineno"> 1340</span>&#160;    <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#a200b038225aabe5eedd7931814d27a44">ElementC</a>,     </div><div class="line"><a name="l01341"></a><span class="lineno"> 1341</span>&#160;    <a class="code" 
href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#acc5cd244b86a03c2b8dd57b01545fbe8">LayoutC</a>,      </div><div class="line"><a name="l01342"></a><span class="lineno"> 1342</span>&#160;    <a class="code" href="structcutlass_1_1gemm_1_1warp_1_1MmaSimtPolicy.html">Policy</a>,       </div><div class="line"><a name="l01343"></a><span class="lineno"> 1343</span>&#160;    PartitionsK   </div><div class="line"><a name="l01344"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#a99137700de654a22fea6d9cdc8f09866"> 1344</a></span>&#160;    &gt;;</div><div class="line"><a name="l01345"></a><span class="lineno"> 1345</span>&#160;</div><div class="line"><a name="l01346"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#a5ce49840c5cc218cafac8469f7f88332"> 1346</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kPaddingM = <a class="code" href="namespacecutlass_1_1gemm_1_1threadblock_1_1detail.html#a16d673aabb47b0d09f506197bf65e240">detail::simt_transpose_padding</a>(kWarpSize, Shape::kK, <a class="code" href="structcutlass_1_1sizeof__bits.html">sizeof_bits&lt;ElementA&gt;::value</a>);</div><div class="line"><a name="l01347"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#a97f871d9a198b28a18c49ce039039c7e"> 1347</a></span>&#160;  <span class="keyword">static</span> <span class="keywordtype">int</span> <span class="keyword">const</span> kPaddingN = <a class="code" 
href="namespacecutlass_1_1gemm_1_1threadblock_1_1detail.html#a16d673aabb47b0d09f506197bf65e240">detail::simt_transpose_padding</a>(kWarpSize, Shape::kK, <a class="code" href="structcutlass_1_1sizeof__bits.html">sizeof_bits&lt;ElementB&gt;::value</a>);</div><div class="line"><a name="l01348"></a><span class="lineno"> 1348</span>&#160;</div><div class="line"><a name="l01350"></a><span class="lineno"> 1350</span>&#160;  <span class="keyword">using</span> <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#a520a725ea60dc096d0cdf0e101d0e547">MmaPolicy</a> = <a class="code" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#a520a725ea60dc096d0cdf0e101d0e547">MmaPolicy</a>&lt;</div><div class="line"><a name="l01351"></a><span class="lineno"> 1351</span>&#160;    <a class="code" href="classcutlass_1_1gemm_1_1warp_1_1MmaSimt.html">MmaWarpSimt</a>,</div><div class="line"><a name="l01352"></a><span class="lineno"> 1352</span>&#160;    <a class="code" href="structcutlass_1_1MatrixShape.html">MatrixShape&lt;0, 0&gt;</a>,</div><div class="line"><a name="l01353"></a><span class="lineno"> 1353</span>&#160;    <a class="code" href="structcutlass_1_1MatrixShape.html">MatrixShape&lt;0, kPaddingN&gt;</a>,</div><div class="line"><a name="l01354"></a><span class="lineno"> 1354</span>&#160;    WarpCount::kK</div><div class="line"><a name="l01355"></a><span class="lineno"><a class="line" href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#a520a725ea60dc096d0cdf0e101d0e547"> 1355</a></span>&#160;  &gt;;</div><div class="line"><a name="l01356"></a><span class="lineno"> 1356</span>&#160;};</div><div class="line"><a name="l01357"></a><span class="lineno"> 1357</span>&#160;</div><div class="line"><a 
name="l01358"></a><span class="lineno"> 1358</span>&#160;} <span class="comment">// namespace threadblock</span></div><div class="line"><a name="l01359"></a><span class="lineno"> 1359</span>&#160;} <span class="comment">// namespace gemm</span></div><div class="line"><a name="l01360"></a><span class="lineno"> 1360</span>&#160;} <span class="comment">// namespace cutlass</span></div><div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52_html_acdc66d5a5d190e94e0562eed3d3ddf30"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#acdc66d5a5d190e94e0562eed3d3ddf30">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 4 &gt;, int8_t, layout::ColumnMajor, int8_t, layout::RowMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::LayoutC</a></div><div class="ttdeci">LayoutC_ LayoutC</div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:756</div></div>
<div class="ttc" id="mma__simt__policy_8h_html"><div class="ttname"><a href="mma__simt__policy_8h.html">mma_simt_policy.h</a></div><div class="ttdoc">Describes the lane policy used by warp-level matrix multiply operators targeting SIMT instructions...</div></div>
<div class="ttc" id="structcutlass_1_1MatrixShape_html"><div class="ttname"><a href="structcutlass_1_1MatrixShape.html">cutlass::MatrixShape</a></div><div class="ttdoc">Describes the size of a matrix tile. </div><div class="ttdef"><b>Definition:</b> matrix_shape.h:42</div></div>
<div class="ttc" id="regular__tile__iterator__pitch__linear_8h_html"><div class="ttname"><a href="regular__tile__iterator__pitch__linear_8h.html">regular_tile_iterator_pitch_linear.h</a></div><div class="ttdoc">Templates implementing loading of tiles from pitch-linear rank=2 tensors. </div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067_html_aabe20df5c98890c82bdd20c351fb9709"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#aabe20df5c98890c82bdd20c351fb9709">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 4 &gt;, int8_t, layout::RowMajor, int8_t, layout::RowMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::MmaPolicy</a></div><div class="ttdeci">MmaPolicy&lt; MmaWarpSimt, MatrixShape&lt; kPaddingM, 0 &gt;, MatrixShape&lt; 0, 0 &gt;, WarpCount::kK &gt; MmaPolicy</div><div class="ttdoc">Policy used to define MmaPipelined. </div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:1195</div></div>
<div class="ttc" id="namespacecutlass_html"><div class="ttname"><a href="namespacecutlass.html">cutlass</a></div><div class="ttdef"><b>Definition:</b> aligned_buffer.h:35</div></div>
<div class="ttc" id="structcutlass_1_1transform_1_1PitchLinear2DThreadTileStripminedThreadMap_html"><div class="ttname"><a href="structcutlass_1_1transform_1_1PitchLinear2DThreadTileStripminedThreadMap.html">cutlass::transform::PitchLinear2DThreadTileStripminedThreadMap</a></div><div class="ttdef"><b>Definition:</b> pitch_linear_thread_map.h:623</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092_html_af0afef329d873475ac2a4eba05bd943c"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#af0afef329d873475ac2a4eba05bd943c">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 1 &gt;, ElementA_, layout::ColumnMajor, ElementB_, layout::RowMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::ElementA</a></div><div class="ttdeci">ElementA_ ElementA</div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:108</div></div>
<div class="ttc" id="platform_8h_html_a72f0657181cca64b44eb186b707eb380"><div class="ttname"><a href="platform_8h.html#a72f0657181cca64b44eb186b707eb380">constexpr</a></div><div class="ttdeci">#define constexpr</div><div class="ttdef"><b>Definition:</b> platform.h:137</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7_html_a6a1ad914c597f2ced6ddb356516a1413"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#a6a1ad914c597f2ced6ddb356516a1413">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 1 &gt;, ElementA_, layout::RowMajor, ElementB_, layout::RowMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::LayoutC</a></div><div class="ttdeci">LayoutC_ LayoutC</div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:435</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1warp_1_1WarpSize_html"><div class="ttname"><a href="structcutlass_1_1gemm_1_1warp_1_1WarpSize.html">cutlass::gemm::warp::WarpSize</a></div><div class="ttdoc">Query the number of threads per warp. </div><div class="ttdef"><b>Definition:</b> gemm/warp/mma.h:43</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52_html_afe290c0c2c5dc44ca2f7b73d93f9fe6f"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#afe290c0c2c5dc44ca2f7b73d93f9fe6f">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 4 &gt;, int8_t, layout::ColumnMajor, int8_t, layout::RowMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::ElementC</a></div><div class="ttdeci">ElementC_ ElementC</div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:755</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_html"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore.html">cutlass::gemm::threadblock::DefaultMmaCore</a></div><div class="ttdef"><b>Definition:</b> default_mma_core.h:90</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0_html_a62de2763f572e5a71e9587f49d0905e6"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#a62de2763f572e5a71e9587f49d0905e6">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 1 &gt;, ElementA_, layout::ColumnMajor, ElementB_, layout::ColumnMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::MmaPolicy</a></div><div class="ttdeci">MmaPolicy&lt; MmaWarpSimt, MatrixShape&lt; 0, 0 &gt;, MatrixShape&lt; 0, kPaddingN &gt;, WarpCount::kK &gt; MmaPolicy</div><div class="ttdoc">Policy used to define MmaPipelined. </div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:719</div></div>
<div class="ttc" id="pitch__linear__thread__map_8h_html"><div class="ttname"><a href="pitch__linear__thread__map_8h.html">pitch_linear_thread_map.h</a></div><div class="ttdoc">Templates implementing how threads are mapped to a given tile. </div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345_html_a98ba20cab0956012d15431f330c4c859"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#a98ba20cab0956012d15431f330c4c859">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 4 &gt;, int8_t, layout::ColumnMajor, int8_t, layout::ColumnMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::WarpShape</a></div><div class="ttdeci">WarpShape_ WarpShape</div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:1225</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345_html_acc5cd244b86a03c2b8dd57b01545fbe8"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#acc5cd244b86a03c2b8dd57b01545fbe8">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 4 &gt;, int8_t, layout::ColumnMajor, int8_t, layout::ColumnMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::LayoutC</a></div><div class="ttdeci">LayoutC_ LayoutC</div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:1232</div></div>
<div class="ttc" id="structcutlass_1_1transform_1_1TransposePitchLinearThreadMapSimt_html"><div class="ttname"><a href="structcutlass_1_1transform_1_1TransposePitchLinearThreadMapSimt.html">cutlass::transform::TransposePitchLinearThreadMapSimt</a></div><div class="ttdef"><b>Definition:</b> pitch_linear_thread_map.h:431</div></div>
<div class="ttc" id="classcutlass_1_1gemm_1_1warp_1_1MmaSimt_html"><div class="ttname"><a href="classcutlass_1_1gemm_1_1warp_1_1MmaSimt.html">cutlass::gemm::warp::MmaSimt</a></div><div class="ttdoc">Structure to compute the matrix product targeting CUDA cores and SIMT math instructions. </div><div class="ttdef"><b>Definition:</b> mma_simt.h:74</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52_html_a03ef3ea08d70d25e222ee0339afa1e0a"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#a03ef3ea08d70d25e222ee0339afa1e0a">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 4 &gt;, int8_t, layout::ColumnMajor, int8_t, layout::RowMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::WarpShape</a></div><div class="ttdeci">WarpShape_ WarpShape</div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:749</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345_html_a0d137c48ec0b4323a153c3a960322687"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#a0d137c48ec0b4323a153c3a960322687">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 4 &gt;, int8_t, layout::ColumnMajor, int8_t, layout::ColumnMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::Operator</a></div><div class="ttdeci">Operator_ Operator</div><div class="ttdoc">Default Operator. </div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:1237</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067_html_a373439df9ac285ab153ac52d1953e8d4"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#a373439df9ac285ab153ac52d1953e8d4">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 4 &gt;, int8_t, layout::RowMajor, int8_t, layout::RowMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::Operator</a></div><div class="ttdeci">Operator_ Operator</div><div class="ttdoc">Default Operator. </div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:1078</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067_html_af274c0fe139375dd34d0ea3dfbaf9703"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#af274c0fe139375dd34d0ea3dfbaf9703">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 4 &gt;, int8_t, layout::RowMajor, int8_t, layout::RowMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::OperatorClass</a></div><div class="ttdeci">arch::OpClassSimt OperatorClass</div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:1074</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7_html_a19213bcaeaf5e7746176526f7c57de32"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#a19213bcaeaf5e7746176526f7c57de32">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 1 &gt;, ElementA_, layout::RowMajor, ElementB_, layout::RowMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::OperatorClass</a></div><div class="ttdeci">arch::OpClassSimt OperatorClass</div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:436</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092_html_a926109870af5f4d9120ce5c98bbed2b6"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#a926109870af5f4d9120ce5c98bbed2b6">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 1 &gt;, ElementA_, layout::ColumnMajor, ElementB_, layout::RowMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::LayoutC</a></div><div class="ttdeci">LayoutC_ LayoutC</div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:113</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52_html_af0d7f0f10f163b0191cebf5e920dfed3"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#af0d7f0f10f163b0191cebf5e920dfed3">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 4 &gt;, int8_t, layout::ColumnMajor, int8_t, layout::RowMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::Operator</a></div><div class="ttdeci">Operator_ Operator</div><div class="ttdoc">Default Operator. </div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:761</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc_html_ae3de45321d07b5b45e17b1ba7ff136ce"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#ae3de45321d07b5b45e17b1ba7ff136ce">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 4 &gt;, int8_t, layout::RowMajor, int8_t, layout::ColumnMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::LayoutC</a></div><div class="ttdeci">LayoutC_ LayoutC</div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:910</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067_html_af7b416c742dacf93ab522a40699c6c71"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#af7b416c742dacf93ab522a40699c6c71">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 4 &gt;, int8_t, layout::RowMajor, int8_t, layout::RowMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::LayoutC</a></div><div class="ttdeci">LayoutC_ LayoutC</div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:1073</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc_html_a3bd2c938edb75c58d6b0d9f5f9970239"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#a3bd2c938edb75c58d6b0d9f5f9970239">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 4 &gt;, int8_t, layout::RowMajor, int8_t, layout::ColumnMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::Shape</a></div><div class="ttdeci">Shape_ Shape</div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:902</div></div>
<div class="ttc" id="classcutlass_1_1layout_1_1ColumnMajor_html"><div class="ttname"><a href="classcutlass_1_1layout_1_1ColumnMajor.html">cutlass::layout::ColumnMajor</a></div><div class="ttdoc">Mapping function for column-major matrices. </div><div class="ttdef"><b>Definition:</b> layout/matrix.h:142</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092_html_a1d91b3f73b2941d84499f28f38b2fcfb"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#a1d91b3f73b2941d84499f28f38b2fcfb">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 1 &gt;, ElementA_, layout::ColumnMajor, ElementB_, layout::RowMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::OperatorClass</a></div><div class="ttdeci">arch::OpClassSimt OperatorClass</div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:114</div></div>
<div class="ttc" id="structcutlass_1_1layout_1_1PitchLinearShape_html"><div class="ttname"><a href="structcutlass_1_1layout_1_1PitchLinearShape.html">cutlass::layout::PitchLinearShape</a></div><div class="ttdoc">Template defining a shape used by pitch-linear operators. </div><div class="ttdef"><b>Definition:</b> pitch_linear.h:43</div></div>
<div class="ttc" id="array_8h_html"><div class="ttname"><a href="array_8h.html">array.h</a></div><div class="ttdoc">Statically sized array of elements that accommodates all CUTLASS-supported numeric types and is safe ...</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7_html_ab593ff2fb5b33cc946b19aab6b1e64bf"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#ab593ff2fb5b33cc946b19aab6b1e64bf">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 1 &gt;, ElementA_, layout::RowMajor, ElementB_, layout::ColumnMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::OperatorClass</a></div><div class="ttdeci">arch::OpClassSimt OperatorClass</div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:270</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52_html_af00303b35d278e533aaf3ae3ba82d017"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#af00303b35d278e533aaf3ae3ba82d017">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 4 &gt;, int8_t, layout::ColumnMajor, int8_t, layout::RowMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::Shape</a></div><div class="ttdeci">Shape_ Shape</div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:748</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1warp_1_1MmaSimtPolicy_html"><div class="ttname"><a href="structcutlass_1_1gemm_1_1warp_1_1MmaSimtPolicy.html">cutlass::gemm::warp::MmaSimtPolicy</a></div><div class="ttdoc">Describes the arrangement and configuration of per-lane operations in warp-level matrix multiply...</div><div class="ttdef"><b>Definition:</b> mma_simt_policy.h:46</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52_html_aada86baebc846e6614f3616688477fba"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#aada86baebc846e6614f3616688477fba">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 4 &gt;, int8_t, layout::ColumnMajor, int8_t, layout::RowMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::MmaPolicy</a></div><div class="ttdeci">MmaPolicy&lt; MmaWarpSimt, MatrixShape&lt; 0, 0 &gt;, MatrixShape&lt; 0, 0 &gt;, WarpCount::kK &gt; MmaPolicy</div><div class="ttdoc">Policy used to define MmaPipelined. </div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:873</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092_html_af8139bed1d2a3d23e9d4e1790a058d01"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#af8139bed1d2a3d23e9d4e1790a058d01">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 1 &gt;, ElementA_, layout::ColumnMajor, ElementB_, layout::RowMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::WarpShape</a></div><div class="ttdeci">WarpShape_ WarpShape</div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:106</div></div>
<div class="ttc" id="matrix__shape_8h_html"><div class="ttname"><a href="matrix__shape_8h.html">matrix_shape.h</a></div><div class="ttdoc">Defines a Shape template for matrix tiles. </div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345_html_a200b038225aabe5eedd7931814d27a44"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#a200b038225aabe5eedd7931814d27a44">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 4 &gt;, int8_t, layout::ColumnMajor, int8_t, layout::ColumnMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::ElementC</a></div><div class="ttdeci">ElementC_ ElementC</div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:1231</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092_html_a43fa0507a4d4bd8ca7df069858f910e6"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#a43fa0507a4d4bd8ca7df069858f910e6">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 1 &gt;, ElementA_, layout::ColumnMajor, ElementB_, layout::RowMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::Shape</a></div><div class="ttdeci">Shape_ Shape</div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:105</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc_html_ad8f801b18df3a58f83aa5e8ce325fcf6"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#ad8f801b18df3a58f83aa5e8ce325fcf6">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 4 &gt;, int8_t, layout::RowMajor, int8_t, layout::ColumnMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::MmaPolicy</a></div><div class="ttdeci">MmaPolicy&lt; MmaWarpSimt, MatrixShape&lt; kPaddingM, 0 &gt;, MatrixShape&lt; 0, kPaddingN &gt;, WarpCount::kK &gt; MmaPolicy</div><div class="ttdoc">Policy used to define MmaPipelined. </div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:1036</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7_html_a1bc7903bc348e342702a6f7e314be337"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#a1bc7903bc348e342702a6f7e314be337">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 1 &gt;, ElementA_, layout::RowMajor, ElementB_, layout::ColumnMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::WarpShape</a></div><div class="ttdeci">WarpShape_ WarpShape</div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:262</div></div>
<div class="ttc" id="structcutlass_1_1sizeof__bits_html"><div class="ttname"><a href="structcutlass_1_1sizeof__bits.html">cutlass::sizeof_bits</a></div><div class="ttdoc">Defines the size of an element in bits. </div><div class="ttdef"><b>Definition:</b> numeric_types.h:42</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345_html_ac2bc54c65c50ee88b7ac877c2c8469a9"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#ac2bc54c65c50ee88b7ac877c2c8469a9">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 4 &gt;, int8_t, layout::ColumnMajor, int8_t, layout::ColumnMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::OperatorClass</a></div><div class="ttdeci">arch::OpClassSimt OperatorClass</div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:1233</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0_html_aeb7ff4ca2dd952e411f92e8628d6c015"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#aeb7ff4ca2dd952e411f92e8628d6c015">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 1 &gt;, ElementA_, layout::ColumnMajor, ElementB_, layout::ColumnMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::LayoutC</a></div><div class="ttdeci">LayoutC_ LayoutC</div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:597</div></div>
<div class="ttc" id="structcutlass_1_1transform_1_1TransposePitchLinearThreadMap2DThreadTile_html"><div class="ttname"><a href="structcutlass_1_1transform_1_1TransposePitchLinearThreadMap2DThreadTile.html">cutlass::transform::TransposePitchLinearThreadMap2DThreadTile</a></div><div class="ttdoc">Thread map that presents a 2D thread-tiled mapping as a transposed PitchLinear2DThreadTile mapping. </div><div class="ttdef"><b>Definition:</b> pitch_linear_thread_map.h:713</div></div>
<div class="ttc" id="default__mma__core_8h_html"><div class="ttname"><a href="default__mma__core_8h.html">default_mma_core.h</a></div><div class="ttdoc">Defines basic properties needed by CTA-level GEMMs assuming expectations about data layout of the glo...</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7_html_aea4174e3f2e32dcd170dea50d5675369"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#aea4174e3f2e32dcd170dea50d5675369">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 1 &gt;, ElementA_, layout::RowMajor, ElementB_, layout::RowMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::ElementC</a></div><div class="ttdeci">ElementC_ ElementC</div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:434</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc_html_a9e0ab047c9957fc0e3ce232e98c91a7e"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#a9e0ab047c9957fc0e3ce232e98c91a7e">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 4 &gt;, int8_t, layout::RowMajor, int8_t, layout::ColumnMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::WarpShape</a></div><div class="ttdeci">WarpShape_ WarpShape</div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:903</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092_html_aa63507fa81a746d9d88363a977018c8b"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#aa63507fa81a746d9d88363a977018c8b">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 1 &gt;, ElementA_, layout::ColumnMajor, ElementB_, layout::RowMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::Operator</a></div><div class="ttdeci">Operator_ Operator</div><div class="ttdoc">Default Operator. </div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:118</div></div>
<div class="ttc" id="numeric__types_8h_html"><div class="ttname"><a href="numeric__types_8h.html">numeric_types.h</a></div><div class="ttdoc">Top-level include for all CUTLASS numeric types. </div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1GemmShape_html"><div class="ttname"><a href="structcutlass_1_1gemm_1_1GemmShape.html">cutlass::gemm::GemmShape</a></div><div class="ttdoc">Shape of a matrix multiply-add operation. </div><div class="ttdef"><b>Definition:</b> include/cutlass/gemm/gemm.h:57</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileIterator_html"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileIterator.html">cutlass::transform::threadblock::RegularTileIterator</a></div><div class="ttdef"><b>Definition:</b> regular_tile_iterator.h:50</div></div>
<div class="ttc" id="platform_8h_html_adde4c9ea91b753491851361a4198c009"><div class="ttname"><a href="platform_8h.html#adde4c9ea91b753491851361a4198c009">static_assert</a></div><div class="ttdeci">#define static_assert(__e, __m)</div><div class="ttdef"><b>Definition:</b> platform.h:153</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0_html_a717f638b194fbbc0692ddd94282a6724"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#a717f638b194fbbc0692ddd94282a6724">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 1 &gt;, ElementA_, layout::ColumnMajor, ElementB_, layout::ColumnMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::Operator</a></div><div class="ttdeci">Operator_ Operator</div><div class="ttdoc">Default Operator. </div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:602</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7_html_aca4a8b44fb78de382813bd3bda11f5ce"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#aca4a8b44fb78de382813bd3bda11f5ce">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 1 &gt;, ElementA_, layout::RowMajor, ElementB_, layout::RowMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::WarpShape</a></div><div class="ttdeci">WarpShape_ WarpShape</div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:428</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067_html_ad3fce3b8a477190dc5d335b549b12c85"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#ad3fce3b8a477190dc5d335b549b12c85">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 4 &gt;, int8_t, layout::RowMajor, int8_t, layout::RowMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::ElementC</a></div><div class="ttdeci">ElementC_ ElementC</div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:1072</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0_html_abb9841f9f90c868e9ec2ee0b19295534"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#abb9841f9f90c868e9ec2ee0b19295534">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 1 &gt;, ElementA_, layout::ColumnMajor, ElementB_, layout::ColumnMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::OperatorClass</a></div><div class="ttdeci">arch::OpClassSimt OperatorClass</div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:598</div></div>
<div class="ttc" id="namespacecutlass_1_1gemm_1_1threadblock_1_1detail_html_a16d673aabb47b0d09f506197bf65e240"><div class="ttname"><a href="namespacecutlass_1_1gemm_1_1threadblock_1_1detail.html#a16d673aabb47b0d09f506197bf65e240">cutlass::gemm::threadblock::detail::simt_transpose_padding</a></div><div class="ttdeci">constexpr int simt_transpose_padding(int threads, int crosswise, int size_in_bits)</div><div class="ttdoc">Computes padding in shared memory to perform efficient transpose without bank conflicts. </div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:67</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067_html_aa62154dc21ce92b46887cefe5fcf3054"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#aa62154dc21ce92b46887cefe5fcf3054">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 4 &gt;, int8_t, layout::RowMajor, int8_t, layout::RowMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::WarpShape</a></div><div class="ttdeci">WarpShape_ WarpShape</div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:1066</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7_html_a6c7b4a920e6d2ab6cf53d51dc410f74f"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#a6c7b4a920e6d2ab6cf53d51dc410f74f">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 1 &gt;, ElementA_, layout::RowMajor, ElementB_, layout::ColumnMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::Shape</a></div><div class="ttdeci">Shape_ Shape</div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:261</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0_html_adec0b67751d581deb517b0eaf74cc6f1"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#adec0b67751d581deb517b0eaf74cc6f1">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 1 &gt;, ElementA_, layout::ColumnMajor, ElementB_, layout::ColumnMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::Shape</a></div><div class="ttdeci">Shape_ Shape</div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:589</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345_html_a520a725ea60dc096d0cdf0e101d0e547"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#a520a725ea60dc096d0cdf0e101d0e547">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 4 &gt;, int8_t, layout::ColumnMajor, int8_t, layout::ColumnMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::MmaPolicy</a></div><div class="ttdeci">MmaPolicy&lt; MmaWarpSimt, MatrixShape&lt; 0, 0 &gt;, MatrixShape&lt; 0, kPaddingN &gt;, WarpCount::kK &gt; MmaPolicy</div><div class="ttdoc">Policy used to define MmaPipelined. </div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:1355</div></div>
<div class="ttc" id="regular__tile__iterator__pitch__linear__2dthreadtile_8h_html"><div class="ttname"><a href="regular__tile__iterator__pitch__linear__2dthreadtile_8h.html">regular_tile_iterator_pitch_linear_2dthreadtile.h</a></div><div class="ttdoc">Templates implementing loading of tiles from pitch-linear rank=2 tensors. </div></div>
<div class="ttc" id="classcutlass_1_1layout_1_1RowMajor_html"><div class="ttname"><a href="classcutlass_1_1layout_1_1RowMajor.html">cutlass::layout::RowMajor</a></div><div class="ttdoc">Mapping function for row-major matrices. </div><div class="ttdef"><b>Definition:</b> layout/matrix.h:50</div></div>
<div class="ttc" id="namespacecutlass_1_1gemm_1_1threadblock_1_1detail_html_a69a9003a33867ce73f81c37b7414c915"><div class="ttname"><a href="namespacecutlass_1_1gemm_1_1threadblock_1_1detail.html#a69a9003a33867ce73f81c37b7414c915">cutlass::gemm::threadblock::detail::simt_get_warp_threads_m</a></div><div class="ttdeci">constexpr int simt_get_warp_threads_m()</div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:62</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc_html_ade835163d1fac35dce14031c37bebb96"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#ade835163d1fac35dce14031c37bebb96">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 4 &gt;, int8_t, layout::RowMajor, int8_t, layout::ColumnMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::ElementC</a></div><div class="ttdeci">ElementC_ ElementC</div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:909</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092_html_a562143e6b199064cd539bde597ec3999"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#a562143e6b199064cd539bde597ec3999">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 1 &gt;, ElementA_, layout::ColumnMajor, ElementB_, layout::RowMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::ElementC</a></div><div class="ttdeci">ElementC_ ElementC</div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:112</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067_html_ac013076a3c9380a79407ad708ac09eb3"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha863d4139ccaa713bc4bde32c425f4067.html#ac013076a3c9380a79407ad708ac09eb3">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 4 &gt;, int8_t, layout::RowMajor, int8_t, layout::RowMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::Shape</a></div><div class="ttdeci">Shape_ Shape</div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:1065</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092_html_a05d5677b44fd111bfe6ebcc6fb7d1676"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#a05d5677b44fd111bfe6ebcc6fb7d1676">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 1 &gt;, ElementA_, layout::ColumnMajor, ElementB_, layout::RowMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::MmaPolicy</a></div><div class="ttdeci">MmaPolicy&lt; MmaWarpSimt, MatrixShape&lt; 0, 0 &gt;, MatrixShape&lt; 0, 0 &gt;, WarpCount::kK &gt; MmaPolicy</div><div class="ttdoc">Policy used to define MmaPipelined. </div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:229</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc_html_ac694a206c028c5e55610f6477da8ed94"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#ac694a206c028c5e55610f6477da8ed94">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 4 &gt;, int8_t, layout::RowMajor, int8_t, layout::ColumnMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::OperatorClass</a></div><div class="ttdeci">arch::OpClassSimt OperatorClass</div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:911</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0_html_a70b15ab8005a28399d5f516545fc7a7c"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#a70b15ab8005a28399d5f516545fc7a7c">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 1 &gt;, ElementA_, layout::ColumnMajor, ElementB_, layout::ColumnMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::ElementC</a></div><div class="ttdeci">ElementC_ ElementC</div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:596</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7_html_a08ebcc80c20f997c2e9385eeb8004b26"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#a08ebcc80c20f997c2e9385eeb8004b26">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 1 &gt;, ElementA_, layout::RowMajor, ElementB_, layout::RowMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::Operator</a></div><div class="ttdeci">Operator_ Operator</div><div class="ttdoc">Default Operator. </div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:440</div></div>
<div class="ttc" id="fast__math_8h_html"><div class="ttname"><a href="fast__math_8h.html">fast_math.h</a></div><div class="ttdoc">Math utilities. </div></div>
<div class="ttc" id="structcutlass_1_1layout_1_1ColumnMajorInterleaved_html"><div class="ttname"><a href="structcutlass_1_1layout_1_1ColumnMajorInterleaved.html">cutlass::layout::ColumnMajorInterleaved&lt; 4 &gt;</a></div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7_html_a19db74df10235f4d5e36518bac33b4c6"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#a19db74df10235f4d5e36518bac33b4c6">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 1 &gt;, ElementA_, layout::RowMajor, ElementB_, layout::ColumnMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::MmaPolicy</a></div><div class="ttdeci">MmaPolicy&lt; MmaWarpSimt, MatrixShape&lt; kPaddingN, 0 &gt;, MatrixShape&lt; 0, kPaddingN &gt;, WarpCount::kK &gt; MmaPolicy</div><div class="ttdoc">Policy used to define MmaPipelined. </div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:395</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7_html_ac514eda9ab5d8a522bf444f9f415d361"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#ac514eda9ab5d8a522bf444f9f415d361">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 1 &gt;, ElementA_, layout::RowMajor, ElementB_, layout::RowMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::Shape</a></div><div class="ttdeci">Shape_ Shape</div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:427</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092_html_aaf221ce787e11cf3edcb49fc2afec46d"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShafafd5c61db86cbfe90863578ddd11092.html#aaf221ce787e11cf3edcb49fc2afec46d">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 1 &gt;, ElementA_, layout::ColumnMajor, ElementB_, layout::RowMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::ElementB</a></div><div class="ttdeci">ElementB_ ElementB</div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:110</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7_html_a85f9b714299218c989d6bd1b48166758"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#a85f9b714299218c989d6bd1b48166758">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 1 &gt;, ElementA_, layout::RowMajor, ElementB_, layout::ColumnMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::ElementC</a></div><div class="ttdeci">ElementC_ ElementC</div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:268</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7_html_a812562a7feb033d7c554ab6d86c30388"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#a812562a7feb033d7c554ab6d86c30388">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 1 &gt;, ElementA_, layout::RowMajor, ElementB_, layout::ColumnMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::Operator</a></div><div class="ttdeci">Operator_ Operator</div><div class="ttdoc">Default Operator. </div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:274</div></div>
<div class="ttc" id="mma__simt_8h_html"><div class="ttname"><a href="mma__simt_8h.html">mma_simt.h</a></div><div class="ttdoc">Templates implementing warp-level matrix multiply-accumulate operations. </div></div>
<div class="ttc" id="namespacecutlass_html_a1676e17a7fea0ac40d9d239cbd3ce872"><div class="ttname"><a href="namespacecutlass.html#a1676e17a7fea0ac40d9d239cbd3ce872">cutlass::const_min</a></div><div class="ttdeci">CUTLASS_HOST_DEVICE constexpr int const_min(int a, int b)</div><div class="ttdef"><b>Definition:</b> fast_math.h:219</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc_html_ab9073ff38dd4579f65b461f887d8e9f6"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShaaf312aafe9da92ea9d417bcc12a8e7dc.html#ab9073ff38dd4579f65b461f887d8e9f6">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 4 &gt;, int8_t, layout::RowMajor, int8_t, layout::ColumnMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::Operator</a></div><div class="ttdeci">Operator_ Operator</div><div class="ttdoc">Default Operator. </div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:915</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7_html_af2c71eb39f54a898753b9ff25e6f3072"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha84e9f8afb6a4ca9f5dcd219b182d16e7.html#af2c71eb39f54a898753b9ff25e6f3072">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 1 &gt;, ElementA_, layout::RowMajor, ElementB_, layout::RowMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::MmaPolicy</a></div><div class="ttdeci">MmaPolicy&lt; MmaWarpSimt, MatrixShape&lt; kPaddingM, 0 &gt;, MatrixShape&lt; 0, 0 &gt;, WarpCount::kK &gt; MmaPolicy</div><div class="ttdoc">Policy used to define MmaPipelined. </div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:557</div></div>
<div class="ttc" id="classcutlass_1_1transform_1_1threadblock_1_1RegularTileIterator2dThreadTile_html"><div class="ttname"><a href="classcutlass_1_1transform_1_1threadblock_1_1RegularTileIterator2dThreadTile.html">cutlass::transform::threadblock::RegularTileIterator2dThreadTile</a></div><div class="ttdef"><b>Definition:</b> regular_tile_iterator_pitch_linear_2dthreadtile.h:59</div></div>
<div class="ttc" id="cutlass_8h_html"><div class="ttname"><a href="cutlass_8h.html">cutlass.h</a></div><div class="ttdoc">Basic include for CUTLASS. </div></div>
<div class="ttc" id="structcutlass_1_1transform_1_1PitchLinearStripminedThreadMap_html"><div class="ttname"><a href="structcutlass_1_1transform_1_1PitchLinearStripminedThreadMap.html">cutlass::transform::PitchLinearStripminedThreadMap</a></div><div class="ttdef"><b>Definition:</b> pitch_linear_thread_map.h:59</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7_html_abbf4045091090bcaf32905afaefb01c5"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha8da7a0cfbbe859b701fdd9f2b8566aa7.html#abbf4045091090bcaf32905afaefb01c5">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 1 &gt;, ElementA_, layout::RowMajor, ElementB_, layout::ColumnMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::LayoutC</a></div><div class="ttdeci">LayoutC_ LayoutC</div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:269</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52_html_a63a2d785d9fa1e0373378b9801aec228"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha34a52cc7b2942e8c290f0032b6779b52.html#a63a2d785d9fa1e0373378b9801aec228">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 4 &gt;, int8_t, layout::ColumnMajor, int8_t, layout::RowMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::OperatorClass</a></div><div class="ttdeci">arch::OpClassSimt OperatorClass</div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:757</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345_html_a03d48dfe750df22f2d071cf070583cbb"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmSha2c0d0b7cdb5c4bcb11e83c058eb65345.html#a03d48dfe750df22f2d071cf070583cbb">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 4 &gt;, int8_t, layout::ColumnMajor, int8_t, layout::ColumnMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::Shape</a></div><div class="ttdeci">Shape_ Shape</div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:1224</div></div>
<div class="ttc" id="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0_html_a7030d7c50418f3b7bda8b6dbf594056f"><div class="ttname"><a href="structcutlass_1_1gemm_1_1threadblock_1_1DefaultMmaCore_3_01Shape___00_01WarpShape___00_01GemmShab94a11a77dd0565102710907089acee0.html#a7030d7c50418f3b7bda8b6dbf594056f">cutlass::gemm::threadblock::DefaultMmaCore&lt; Shape_, WarpShape_, GemmShape&lt; 1, 1, 1 &gt;, ElementA_, layout::ColumnMajor, ElementB_, layout::ColumnMajor, ElementC_, LayoutC_, arch::OpClassSimt, 2, Operator_ &gt;::WarpShape</a></div><div class="ttdeci">WarpShape_ WarpShape</div><div class="ttdef"><b>Definition:</b> default_mma_core_simt.h:590</div></div>
<div class="ttc" id="structcutlass_1_1layout_1_1RowMajorInterleaved_html"><div class="ttname"><a href="structcutlass_1_1layout_1_1RowMajorInterleaved.html">cutlass::layout::RowMajorInterleaved</a></div><div class="ttdef"><b>Definition:</b> layout/matrix.h:237</div></div>
</div><!-- fragment --></div><!-- contents -->
<!-- start footer part -->
<hr class="footer"/><address class="footer"><small>
Generated by &#160;<a href="https://www.doxygen.org/index.html">
<img class="footer" src="doxygen.png" alt="doxygen"/>
</a> 1.8.11
</small></address>
</body>
</html>
